Advertisement
Guest User

Untitled

a guest
Jan 13th, 2017
138
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 13.06 KB | None | 0 0
  1. <?xml version="1.0" encoding="UTF-8"?>
  2. <!-- Solr managed schema - automatically generated - DO NOT EDIT -->
  3. <schema name="nutch" version="1.5">
  <!-- Schema-wide settings: "id" is the unique key, "text" is the default
       search field, and OR is the query parser's default operator. Both "id"
       and "text" are declared as <field> elements later in this schema.
       NOTE(review): <defaultSearchField> and <solrQueryParser> are believed to
       be deprecated in later Solr releases; confirm against the target Solr
       version before upgrading. -->
  4. <uniqueKey>id</uniqueKey>
  5. <defaultSearchField>text</defaultSearchField>
  6. <solrQueryParser defaultOperator="OR"/>
  <!-- Primitive field types, one per line.
       * binary, boolean and booleans (booleans is the multiValued variant).
       * date, double, float, int, long: Trie classes, all with
         precisionStep="0", positionIncrementGap="0" and omitNorms="true".
       * ignored: a StrField declared with indexed="false" and stored="false".
       * location: LatLonType with subFieldSuffix="_coordinate"; the suffix
         matches the "*_coordinate" dynamicField declared later in this schema.
       Of these, booleans, double and ignored are not referenced by any <field>
       or <dynamicField> in the visible schema. -->
  7. <fieldType name="binary" class="solr.BinaryField"/>
  8. <fieldType name="boolean" class="solr.BoolField" sortMissingLast="true"/>
  9. <fieldType name="booleans" class="solr.BoolField" sortMissingLast="true" multiValued="true"/>
  10. <fieldType name="date" class="solr.TrieDateField" omitNorms="true" positionIncrementGap="0" precisionStep="0"/>
  11. <fieldType name="double" class="solr.TrieDoubleField" omitNorms="true" positionIncrementGap="0" precisionStep="0"/>
  12. <fieldType name="float" class="solr.TrieFloatField" omitNorms="true" positionIncrementGap="0" precisionStep="0"/>
  13. <fieldType name="ignored" class="solr.StrField" indexed="false" stored="false" multiValued="true"/>
  14. <fieldType name="int" class="solr.TrieIntField" omitNorms="true" positionIncrementGap="0" precisionStep="0"/>
  15. <fieldType name="location" class="solr.LatLonType" subFieldSuffix="_coordinate"/>
  16. <fieldType name="long" class="solr.TrieLongField" omitNorms="true" positionIncrementGap="0" precisionStep="0"/>
  <!-- "lowercase": TextField with a single <analyzer> (no type attribute) that
       runs KeywordTokenizerFactory followed by LowerCaseFilterFactory.
       Presumably this keeps the whole value as one lowercased token; confirm
       against the Solr tokenizer reference. Not referenced by any <field> in
       the visible schema. -->
  17. <fieldType name="lowercase" class="solr.TextField" positionIncrementGap="100">
  18. <analyzer>
  19. <tokenizer class="solr.KeywordTokenizerFactory"/>
  20. <filter class="solr.LowerCaseFilterFactory"/>
  21. </analyzer>
  22. </fieldType>
  <!-- "payloads": TextField declared indexed but not stored. Its single
       analyzer splits with WhitespaceTokenizerFactory and then applies
       DelimitedPayloadTokenFilterFactory with encoder="float". No delimiter
       attribute is given, so the factory's default applies (TODO confirm which
       character that is). Not referenced by any <field> in the visible
       schema. -->
  23. <fieldType name="payloads" class="solr.TextField" indexed="true" stored="false">
  24. <analyzer>
  25. <tokenizer class="solr.WhitespaceTokenizerFactory"/>
  26. <filter class="solr.DelimitedPayloadTokenFilterFactory" encoder="float"/>
  27. </analyzer>
  28. </fieldType>
  <!-- "phonetic": TextField declared indexed but not stored. Its single
       analyzer runs StandardTokenizerFactory followed by
       DoubleMetaphoneFilterFactory with inject="false".
       NOTE(review): inject="false" presumably means the phonetic codes replace
       the original tokens instead of being added next to them; confirm. Not
       referenced by any <field> in the visible schema. -->
  29. <fieldType name="phonetic" class="solr.TextField" indexed="true" stored="false">
  30. <analyzer>
  31. <tokenizer class="solr.StandardTokenizerFactory"/>
  32. <filter class="solr.DoubleMetaphoneFilterFactory" inject="false"/>
  33. </analyzer>
  34. </fieldType>
  <!-- String types and the "t"-prefixed Trie date/double types.
       * string / strings: StrField with sortMissingLast="true".
       * tdate / tdates: TrieDateField with precisionStep="6".
       * tdouble / tdoubles: TrieDoubleField with precisionStep="8".
       The plural names are the multiValued variants; unlike their singular
       counterparts they do not set omitNorms="true". tdates and tdoubles are
       not referenced by any <field> or <dynamicField> in the visible schema. -->
  35. <fieldType name="string" class="solr.StrField" omitNorms="true" sortMissingLast="true"/>
  36. <fieldType name="strings" class="solr.StrField" sortMissingLast="true" multiValued="true"/>
  37. <fieldType name="tdate" class="solr.TrieDateField" omitNorms="true" positionIncrementGap="0" precisionStep="6"/>
  38. <fieldType name="tdates" class="solr.TrieDateField" positionIncrementGap="0" multiValued="true" precisionStep="6"/>
  39. <fieldType name="tdouble" class="solr.TrieDoubleField" omitNorms="true" positionIncrementGap="0" precisionStep="8"/>
  40. <fieldType name="tdoubles" class="solr.TrieDoubleField" positionIncrementGap="0" multiValued="true" precisionStep="8"/>
  <!-- "text_en": English text type, used by the "content" and "title" fields.
       It declares separate index and query analyzers. Both tokenize with
       StandardTokenizerFactory and then apply, in listed order: stop words
       (stopwords.txt, ignoreCase), lowercasing, English possessive removal,
       keyword protection (protwords.txt) and Porter stemming.
       The query analyzer differs only by an extra SynonymFilterFactory
       (synonyms.txt, expand="true") placed directly after the tokenizer. -->
  41. <fieldType name="text_en" class="solr.TextField" positionIncrementGap="100">
  42. <analyzer type="index">
  43. <tokenizer class="solr.StandardTokenizerFactory"/>
  44. <filter class="solr.StopFilterFactory" words="stopwords.txt" ignoreCase="true"/>
  45. <filter class="solr.LowerCaseFilterFactory"/>
  46. <filter class="solr.EnglishPossessiveFilterFactory"/>
  47. <filter class="solr.KeywordMarkerFilterFactory" protected="protwords.txt"/>
  48. <filter class="solr.PorterStemFilterFactory"/>
  49. </analyzer>
  50. <analyzer type="query">
  51. <tokenizer class="solr.StandardTokenizerFactory"/>
  52. <filter class="solr.SynonymFilterFactory" expand="true" ignoreCase="true" synonyms="synonyms.txt"/>
  53. <filter class="solr.StopFilterFactory" words="stopwords.txt" ignoreCase="true"/>
  54. <filter class="solr.LowerCaseFilterFactory"/>
  55. <filter class="solr.EnglishPossessiveFilterFactory"/>
  56. <filter class="solr.KeywordMarkerFilterFactory" protected="protwords.txt"/>
  57. <filter class="solr.PorterStemFilterFactory"/>
  58. </analyzer>
  59. </fieldType>
  <!-- "text_en_splitting": English text type with
       autoGeneratePhraseQueries="true". Both analyzers tokenize on whitespace
       and apply stop words, WordDelimiterFilterFactory, lowercasing, keyword
       protection (protwords.txt) and Porter stemming.
       Differences between the two chains:
       * index: WordDelimiter uses catenateWords="1" and catenateNumbers="1".
       * query: WordDelimiter uses catenateWords="0" and catenateNumbers="0",
         and a SynonymFilterFactory (expand="true") runs right after the
         tokenizer.
       Not referenced by any <field> in the visible schema. -->
  60. <fieldType name="text_en_splitting" class="solr.TextField" autoGeneratePhraseQueries="true" positionIncrementGap="100">
  61. <analyzer type="index">
  62. <tokenizer class="solr.WhitespaceTokenizerFactory"/>
  63. <filter class="solr.StopFilterFactory" words="stopwords.txt" ignoreCase="true"/>
  64. <filter class="solr.WordDelimiterFilterFactory" catenateNumbers="1" generateNumberParts="1" splitOnCaseChange="1" generateWordParts="1" catenateAll="0" catenateWords="1"/>
  65. <filter class="solr.LowerCaseFilterFactory"/>
  66. <filter class="solr.KeywordMarkerFilterFactory" protected="protwords.txt"/>
  67. <filter class="solr.PorterStemFilterFactory"/>
  68. </analyzer>
  69. <analyzer type="query">
  70. <tokenizer class="solr.WhitespaceTokenizerFactory"/>
  71. <filter class="solr.SynonymFilterFactory" expand="true" ignoreCase="true" synonyms="synonyms.txt"/>
  72. <filter class="solr.StopFilterFactory" words="stopwords.txt" ignoreCase="true"/>
  73. <filter class="solr.WordDelimiterFilterFactory" catenateNumbers="0" generateNumberParts="1" splitOnCaseChange="1" generateWordParts="1" catenateAll="0" catenateWords="0"/>
  74. <filter class="solr.LowerCaseFilterFactory"/>
  75. <filter class="solr.KeywordMarkerFilterFactory" protected="protwords.txt"/>
  76. <filter class="solr.PorterStemFilterFactory"/>
  77. </analyzer>
  78. </fieldType>
  <!-- "text_en_splitting_tight": variant of text_en_splitting with one shared
       <analyzer> (no type attribute). Compared with text_en_splitting it:
       * applies synonyms with expand="false";
       * configures WordDelimiterFilterFactory with generateWordParts="0" and
         generateNumberParts="0" while keeping catenateWords="1" and
         catenateNumbers="1";
       * stems with EnglishMinimalStemFilterFactory instead of Porter;
       * ends with RemoveDuplicatesTokenFilterFactory.
       Not referenced by any <field> in the visible schema. -->
  79. <fieldType name="text_en_splitting_tight" class="solr.TextField" autoGeneratePhraseQueries="true" positionIncrementGap="100">
  80. <analyzer>
  81. <tokenizer class="solr.WhitespaceTokenizerFactory"/>
  82. <filter class="solr.SynonymFilterFactory" expand="false" ignoreCase="true" synonyms="synonyms.txt"/>
  83. <filter class="solr.StopFilterFactory" words="stopwords.txt" ignoreCase="true"/>
  84. <filter class="solr.WordDelimiterFilterFactory" catenateNumbers="1" generateNumberParts="0" generateWordParts="0" catenateAll="0" catenateWords="1"/>
  85. <filter class="solr.LowerCaseFilterFactory"/>
  86. <filter class="solr.KeywordMarkerFilterFactory" protected="protwords.txt"/>
  87. <filter class="solr.EnglishMinimalStemFilterFactory"/>
  88. <filter class="solr.RemoveDuplicatesTokenFilterFactory"/>
  89. </analyzer>
  90. </fieldType>
  <!-- "text_general": language-neutral text type, used by the "anchor" and
       "text" fields. Index chain: StandardTokenizerFactory, stop words
       (stopwords.txt, ignoreCase), lowercasing. The query chain is the same
       with a SynonymFilterFactory (synonyms.txt, expand="true") inserted
       between the stop filter and the lowercase filter.
       NOTE(review): here the synonym filter runs after the stop filter, while
       the text_en and text_general_rev query chains in this schema run it
       before; confirm the difference is intentional. -->
  91. <fieldType name="text_general" class="solr.TextField" positionIncrementGap="100">
  92. <analyzer type="index">
  93. <tokenizer class="solr.StandardTokenizerFactory"/>
  94. <filter class="solr.StopFilterFactory" words="stopwords.txt" ignoreCase="true"/>
  95. <filter class="solr.LowerCaseFilterFactory"/>
  96. </analyzer>
  97. <analyzer type="query">
  98. <tokenizer class="solr.StandardTokenizerFactory"/>
  99. <filter class="solr.StopFilterFactory" words="stopwords.txt" ignoreCase="true"/>
  100. <filter class="solr.SynonymFilterFactory" expand="true" ignoreCase="true" synonyms="synonyms.txt"/>
  101. <filter class="solr.LowerCaseFilterFactory"/>
  102. </analyzer>
  103. </fieldType>
  <!-- "text_general_rev": like text_general, but the index chain ends with
       ReversedWildcardFilterFactory (withOriginal="true", maxPosAsterisk="3",
       maxPosQuestion="2", maxFractionAsterisk="0.33"). The query chain has no
       reversal filter; it applies synonyms (expand="true"), stop words and
       lowercasing, in that order. Presumably intended to speed up
       leading-wildcard queries; confirm against the Solr filter reference.
       Not referenced by any <field> in the visible schema. -->
  104. <fieldType name="text_general_rev" class="solr.TextField" positionIncrementGap="100">
  105. <analyzer type="index">
  106. <tokenizer class="solr.StandardTokenizerFactory"/>
  107. <filter class="solr.StopFilterFactory" words="stopwords.txt" ignoreCase="true"/>
  108. <filter class="solr.LowerCaseFilterFactory"/>
  109. <filter class="solr.ReversedWildcardFilterFactory" maxPosQuestion="2" maxFractionAsterisk="0.33" maxPosAsterisk="3" withOriginal="true"/>
  110. </analyzer>
  111. <analyzer type="query">
  112. <tokenizer class="solr.StandardTokenizerFactory"/>
  113. <filter class="solr.SynonymFilterFactory" expand="true" ignoreCase="true" synonyms="synonyms.txt"/>
  114. <filter class="solr.StopFilterFactory" words="stopwords.txt" ignoreCase="true"/>
  115. <filter class="solr.LowerCaseFilterFactory"/>
  116. </analyzer>
  117. </fieldType>
  <!-- "text_path": TextField whose single analyzer consists only of
       PathHierarchyTokenizerFactory, with no filters and no delimiter
       attribute (so the tokenizer's default delimiter applies; TODO confirm).
       Not referenced by any <field> in the visible schema. -->
  118. <fieldType name="text_path" class="solr.TextField" positionIncrementGap="100">
  119. <analyzer>
  120. <tokenizer class="solr.PathHierarchyTokenizerFactory"/>
  121. </analyzer>
  122. </fieldType>
  <!-- "t"-prefixed Trie numeric types (float, int, long), all with
       precisionStep="8", in contrast to the precisionStep="0" float/int/long
       types declared earlier. tlongs is the multiValued variant of tlong and
       does not set omitNorms. None of these four types is referenced by a
       <field> or <dynamicField> in the visible schema. -->
  123. <fieldType name="tfloat" class="solr.TrieFloatField" omitNorms="true" positionIncrementGap="0" precisionStep="8"/>
  124. <fieldType name="tint" class="solr.TrieIntField" omitNorms="true" positionIncrementGap="0" precisionStep="8"/>
  125. <fieldType name="tlong" class="solr.TrieLongField" omitNorms="true" positionIncrementGap="0" precisionStep="8"/>
  126. <fieldType name="tlongs" class="solr.TrieLongField" positionIncrementGap="0" multiValued="true" precisionStep="8"/>
  <!-- "url": text type used by the "host" and "url" fields. Its single
       analyzer runs StandardTokenizerFactory, then LowerCaseFilterFactory,
       then WordDelimiterFilterFactory with generateWordParts="1" and
       generateNumberParts="1". The word delimiter runs after lowercasing, so
       it only ever sees lowercased tokens. -->
  127. <fieldType name="url" class="solr.TextField" positionIncrementGap="100">
  128. <analyzer>
  129. <tokenizer class="solr.StandardTokenizerFactory"/>
  130. <filter class="solr.LowerCaseFilterFactory"/>
  131. <filter class="solr.WordDelimiterFilterFactory" generateNumberParts="1" generateWordParts="1"/>
  132. </analyzer>
  133. </fieldType>
  <!-- Field declarations, sorted by name in ASCII order (uppercase letters
       sort before lowercase, e.g. "isSatelitteProv" before "isp").
       Points worth knowing when reading the list:
       * "id" is the only field marked required="true"; it is also the
         schema's uniqueKey.
       * "text" is multiValued, indexed and not stored; it is the default
         search field and the destination of most copyField rules at the end
         of this schema.
       * "host" is indexed but not stored; "tld" is neither indexed nor stored.
       * "meta_description" and "meta_keywords" set no indexed/stored
         attributes; presumably they fall back to the defaults of the
         "strings" type (TODO confirm).
       * "date" uses the tdate type, while "lastModified", "publishedDate",
         "tstamp" and "updatedDate" use the plain date type.
       * "latLon" is a string field that a copyField rule copies into
         "location" (LatLonType).
       * NOTE(review): "isSatelitteProv" looks like a misspelling of
         "Satellite"; the name is part of the schema's public field list, so
         confirm with the indexing side before renaming. -->
  134. <field name="_version_" type="long" indexed="true" stored="true"/>
  135. <field name="accRadius" type="int" indexed="true" stored="true"/>
  136. <field name="anchor" type="text_general" multiValued="true" indexed="true" stored="true"/>
  137. <field name="author" type="string" indexed="true" stored="true"/>
  138. <field name="autonSystemNum" type="int" indexed="true" stored="true"/>
  139. <field name="autonSystemOrg" type="string" indexed="true" stored="true"/>
  140. <field name="binaryContent" type="binary" indexed="false" stored="true"/>
  141. <field name="boost" type="float" indexed="false" stored="true"/>
  142. <field name="cache" type="string" indexed="false" stored="true"/>
  143. <field name="cc" type="string" multiValued="true" indexed="true" stored="true"/>
  144. <field name="cityConfidence" type="int" indexed="true" stored="true"/>
  145. <field name="cityGeoNameId" type="int" indexed="true" stored="true"/>
  146. <field name="cityName" type="string" indexed="true" stored="true"/>
  147. <field name="connType" type="string" indexed="true" stored="true"/>
  148. <field name="content" type="text_en" indexed="true" stored="true"/>
  149. <field name="contentLength" type="string" indexed="false" stored="true"/>
  150. <field name="contentName" type="string" indexed="true" stored="true"/>
  151. <field name="continentCode" type="string" indexed="true" stored="true"/>
  152. <field name="continentGeoNameId" type="int" indexed="true" stored="true"/>
  153. <field name="countryConfidence" type="int" indexed="true" stored="true"/>
  154. <field name="countryGeoNameId" type="int" indexed="true" stored="true"/>
  155. <field name="countryIsoCode" type="string" indexed="true" stored="true"/>
  156. <field name="countryName" type="string" indexed="true" stored="true"/>
  157. <field name="countryType" type="string" indexed="true" stored="true"/>
  158. <field name="date" type="tdate" indexed="true" stored="true"/>
  159. <field name="digest" type="string" indexed="false" stored="true"/>
  160. <field name="domain" type="string" indexed="true" stored="true"/>
  161. <field name="feed" type="string" indexed="true" stored="true"/>
  162. <field name="host" type="url" indexed="true" stored="false"/>
  163. <field name="id" type="string" indexed="true" required="true" stored="true"/>
  164. <field name="ip" type="string" indexed="true" stored="true"/>
  165. <field name="isAnonProxy" type="boolean" indexed="true" stored="true"/>
  166. <field name="isSatelitteProv" type="boolean" indexed="true" stored="true"/>
  167. <field name="isp" type="string" indexed="true" stored="true"/>
  168. <field name="lang" type="string" indexed="true" stored="true"/>
  169. <field name="lastModified" type="date" indexed="true" stored="true"/>
  170. <field name="latLon" type="string" indexed="true" stored="true"/>
  171. <field name="location" type="location" indexed="true" stored="true"/>
  172. <field name="meta_description" type="strings"/>
  173. <field name="meta_keywords" type="strings"/>
  174. <field name="metroCode" type="int" indexed="true" stored="true"/>
  175. <field name="org" type="string" indexed="true" stored="true"/>
  176. <field name="postalCode" type="string" indexed="true" stored="true"/>
  177. <field name="postalConfidence" type="int" indexed="true" stored="true"/>
  178. <field name="publishedDate" type="date" indexed="true" stored="true"/>
  179. <field name="segment" type="string" indexed="false" stored="true"/>
  180. <field name="subDivConfidence" type="int" indexed="true" stored="true"/>
  181. <field name="subDivGeoNameId" type="int" indexed="true" stored="true"/>
  182. <field name="subDivIsoCode" type="string" indexed="true" stored="true"/>
  183. <field name="subDivName" type="string" indexed="true" stored="true"/>
  184. <field name="subcollection" type="string" multiValued="true" indexed="true" stored="true"/>
  185. <field name="tag" type="string" multiValued="true" indexed="true" stored="true"/>
  186. <field name="text" type="text_general" multiValued="true" indexed="true" stored="false"/>
  187. <field name="timeZone" type="string" indexed="true" stored="true"/>
  188. <field name="title" type="text_en" indexed="true" stored="true"/>
  189. <field name="tld" type="string" indexed="false" stored="false"/>
  190. <field name="tstamp" type="date" indexed="false" stored="true"/>
  191. <field name="type" type="string" multiValued="true" indexed="true" stored="true"/>
  192. <field name="updatedDate" type="date" indexed="true" stored="true"/>
  193. <field name="url" type="url" indexed="true" stored="true"/>
  194. <field name="userType" type="string" indexed="true" stored="true"/>
  <!-- Dynamic field for any name ending in "_coordinate": tdouble, indexed and
       not stored. The pattern matches the subFieldSuffix="_coordinate" set on
       the "location" fieldType, so it presumably backs the sub-fields of the
       "location" field (TODO confirm against the LatLonType documentation). -->
  195. <dynamicField name="*_coordinate" type="tdouble" indexed="true" stored="false"/>
  <!-- Copy rules. anchor, author, content, title and url are copied into
       "text", the default search field, which is multiValued, indexed and not
       stored. latLon (a string field) is copied into "location", the
       LatLonType field. -->
  196. <copyField source="anchor" dest="text"/>
  197. <copyField source="author" dest="text"/>
  198. <copyField source="content" dest="text"/>
  199. <copyField source="latLon" dest="location"/>
  200. <copyField source="title" dest="text"/>
  201. <copyField source="url" dest="text"/>
  202. </schema>
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement