Advertisement
Guest User

Untitled

a guest
Mar 6th, 2019
93
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 7.30 KB | None | 0 0
  1. <?xml version="1.0" encoding="utf-8"?>
  2.  
  3. <dataConfig>
  4.  
  <!-- JDBC connection named "db" pointing at the local ktimatologio MySQL
       schema. The SQL entities in this file select it with dataSource="db".
       NOTE(review): batchSize="-1" is presumably the usual DIH setting for
       MySQL row streaming; confirm against the Solr version in use. -->
  <dataSource name="db"
              type="JdbcDataSource"
              driver="com.mysql.jdbc.Driver"
              url="jdbc:mysql://127.0.0.1:3306/ktimatologio"
              user="root"
              password="********"
              batchSize="-1"
              autoCommit="true"
              convertType="false"/>
  13.  
  <!-- Secondary data source named "fieldReader"; the nested
       TikaEntityProcessor entity reads its dataField through it. -->
  <dataSource type="FieldStreamDataSource" name="fieldReader"/>
  15.  
  16. <document>
  17.  
  <!-- Indexes the rows of aitiologikes_ektheseis whose type is 'text'.

       pk="id"          Declared so delta imports can resolve the changed row;
                        DIH needs the entity primary key for delta handling.
       query            Full import: every 'text' row.
       deltaQuery       Returns only the ids of rows modified since the last
                        index run; nothing else from this result set is used.
       deltaImportQuery Re-reads one changed row via ${dataimporter.delta.id}.

       content is built with CONCAT_WS(' ', body, title) rather than CONCAT:
       MySQL CONCAT yields NULL as soon as one argument is NULL, which would
       drop the body of any row that has no title (and vice versa).
       HTMLStripTransformer applies to the fields flagged stripHTML="true". -->
  <entity name="aitiologikes_ektheseis"
          dataSource="db"
          pk="id"
          transformer="HTMLStripTransformer"
          query="select id, title, title AS grid_title, model, type, url, last_modified, CONCAT_WS('_',id,model) AS solr_id, search_tag, CONCAT_WS(' ',body,title) AS content from aitiologikes_ektheseis where type = 'text'"
          deltaQuery="select id from aitiologikes_ektheseis where type = 'text' and last_modified &gt; '${dataimporter.last_index_time}'"
          deltaImportQuery="select id, title, title AS grid_title, model, type, url, last_modified, CONCAT_WS('_',id,model) AS solr_id, search_tag, CONCAT_WS(' ',body,title) AS content from aitiologikes_ektheseis where type = 'text' and id='${dataimporter.delta.id}'">
    <!-- Database id is stored under the Solr field "ida". -->
    <field column="id" name="ida" />
    <!-- Composite "<id>_<model>" key computed in SQL. -->
    <field column="solr_id" name="solr_id" />
    <field column="title" name="title" stripHTML="true" />
    <field column="grid_title" name="grid_title" stripHTML="true" />
    <field column="model" name="model" stripHTML="true" />
    <field column="type" name="type" stripHTML="true" />
    <field column="url" name="url" stripHTML="true" />
    <field column="last_modified" name="last_modified" stripHTML="true" />
    <field column="search_tag" name="search_tag" stripHTML="true" />
    <field column="content" name="content" stripHTML="true" />
  </entity>
  35.  
  <!-- Indexes the rows of aitiologikes_ektheseis whose type is 'bin'. The
       binary column bin_con is selected as "text" and handed to a nested
       Tika entity, whose extracted text lands in the Solr field contentbin.

       pk="id"          Declared so delta imports can resolve the changed row.
       transformer      HTMLStripTransformer, matching the sibling 'text'
                        entity: the stripHTML="true" flags below only take
                        effect when that transformer is registered. The
                        previous TemplateTransformer had no template
                        attribute to act on.
       deltaQuery       Returns only ids, so the bin_con blob is not read
                        just to discover which rows changed.
       deltaImportQuery Re-reads one changed row via ${dataimporter.delta.id}. -->
  <entity name="aitiologikes_ektheseis_bin"
          dataSource="db"
          pk="id"
          transformer="HTMLStripTransformer"
          query="select id, title, title AS grid_title, model, type, url, last_modified, CONCAT_WS('_',id,model) AS solr_id, search_tag, bin_con AS text from aitiologikes_ektheseis where type = 'bin'"
          deltaQuery="select id from aitiologikes_ektheseis where type = 'bin' and last_modified &gt; '${dataimporter.last_index_time}'"
          deltaImportQuery="select id, title, title AS grid_title, model, type, url, last_modified, CONCAT_WS('_',id,model) AS solr_id, search_tag, bin_con AS text from aitiologikes_ektheseis where type = 'bin' and id='${dataimporter.delta.id}'">
    <!-- Database id is stored under the Solr field "ida". -->
    <field column="id" name="ida" />
    <!-- Composite "<id>_<model>" key computed in SQL. -->
    <field column="solr_id" name="solr_id" />
    <field column="title" name="title" stripHTML="true" />
    <field column="grid_title" name="grid_title" stripHTML="true" />
    <field column="model" name="model" stripHTML="true" />
    <field column="type" name="type" stripHTML="true" />
    <field column="url" name="url" stripHTML="true" />
    <field column="last_modified" name="last_modified" stripHTML="true" />
    <field column="search_tag" name="search_tag" stripHTML="true" />

    <!-- Runs Tika over the parent row's "text" column (the bin_con blob),
         read through the fieldReader data source. format="text" requests
         plain-text output, so no stripHTML flag is set on the field; this
         entity registers no transformer that could honour one. The entity is
         given an explicit name instead of relying on an auto-generated one. -->
    <entity name="aitiologikes_ektheseis_bin_tika"
            processor="TikaEntityProcessor"
            dataSource="fieldReader"
            dataField="aitiologikes_ektheseis_bin.text"
            format="text">
      <field column="text" name="contentbin" />
    </entity>

  </entity>
  57.  
  58. ...
  59. ...
  60. </document>
  61.  
  62. </dataConfig>
  63.  
  <!-- Mixed English/Greek text analysis used by title, grid_title and content.

       Both analyzers apply the same filters in the same order, so a term is
       reduced to the same token at index time and at query time; the query
       analyzer only adds synonym expansion up front.

       Order matters:
         1. Case folding (LowerCase, then GreekLowerCase) and English
            possessive removal come first.
         2. Stop-word removal follows, so the Greek stop list is matched
            against folded tokens. NOTE(review): this assumes
            lang/stopwords_el.txt holds folded forms (no tonos, final sigma
            written as sigma), as the stock Lucene list does; confirm if the
            file was customized.
         3. KeywordMarker precedes both stemmers so that entries of
            protwords.txt are shielded from Greek and Porter stemming alike.
         4. Stemming (Greek, then Porter) runs last.

       Documents analyzed with the previous filter order need a reindex. -->
  <fieldType name="text_ktimatologio" class="solr.TextField" positionIncrementGap="100">

    <analyzer type="index">
      <tokenizer class="solr.StandardTokenizerFactory"/>
      <filter class="solr.LowerCaseFilterFactory"/>
      <filter class="solr.EnglishPossessiveFilterFactory"/>
      <filter class="solr.GreekLowerCaseFilterFactory"/>
      <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_en.txt" enablePositionIncrements="true"/>
      <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_el.txt" enablePositionIncrements="true"/>
      <filter class="solr.KeywordMarkerFilterFactory" protected="protwords.txt"/>
      <filter class="solr.GreekStemFilterFactory"/>
      <filter class="solr.PorterStemFilterFactory"/>
    </analyzer>

    <analyzer type="query">
      <tokenizer class="solr.StandardTokenizerFactory"/>
      <!-- Query-time only: expand synonyms before any normalization. -->
      <filter class="solr.SynonymFilterFactory" synonyms="synonyms.txt" ignoreCase="true" expand="true"/>
      <filter class="solr.LowerCaseFilterFactory"/>
      <filter class="solr.EnglishPossessiveFilterFactory"/>
      <filter class="solr.GreekLowerCaseFilterFactory"/>
      <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_en.txt" enablePositionIncrements="true"/>
      <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_el.txt" enablePositionIncrements="true"/>
      <filter class="solr.KeywordMarkerFilterFactory" protected="protwords.txt"/>
      <filter class="solr.GreekStemFilterFactory"/>
      <filter class="solr.PorterStemFilterFactory"/>
    </analyzer>
  </fieldType>
  91.  
  <!-- Greek text analysis with HTML stripping, used by contentbin.

       Index and query analyzers are identical. Case folding (LowerCase, then
       GreekLowerCase) runs before the Greek stop filter so the stop list is
       matched against folded tokens, and the query chain no longer applies
       LowerCaseFilterFactory twice.
       NOTE(review): this assumes lang/stopwords_el.txt holds folded forms
       (no tonos, final sigma written as sigma); confirm if it was customized.
       NOTE(review): HunspellStemFilter receives tokens already reduced by
       GreekStemFilter, so dictionary lookups may rarely match; verify that
       chaining both stemmers is intended.

       Documents analyzed with the previous filter order need a reindex. -->
  <fieldType name="text" class="solr.TextField" positionIncrementGap="100">
    <analyzer type="index">
      <charFilter class="solr.HTMLStripCharFilterFactory"/>
      <tokenizer class="solr.StandardTokenizerFactory"/>
      <filter class="solr.StandardFilterFactory"/>
      <filter class="solr.LowerCaseFilterFactory"/>
      <filter class="solr.GreekLowerCaseFilterFactory"/>
      <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_el.txt" enablePositionIncrements="true"/>
      <filter class="solr.GreekStemFilterFactory"/>
      <filter class="solr.HunspellStemFilterFactory" dictionary="dictionaries/el_GR.dic" affix="dictionaries/el_GR.aff" ignoreCase="true" />
    </analyzer>

    <analyzer type="query">
      <charFilter class="solr.HTMLStripCharFilterFactory"/>
      <tokenizer class="solr.StandardTokenizerFactory"/>
      <filter class="solr.StandardFilterFactory"/>
      <filter class="solr.LowerCaseFilterFactory"/>
      <filter class="solr.GreekLowerCaseFilterFactory"/>
      <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_el.txt" enablePositionIncrements="true"/>
      <filter class="solr.GreekStemFilterFactory"/>
      <filter class="solr.HunspellStemFilterFactory" dictionary="dictionaries/el_GR.dic" affix="dictionaries/el_GR.aff" ignoreCase="true" />
    </analyzer>
  </fieldType>
  116.  
  <!-- Solr fields that receive the columns mapped by the import entities. -->
  <fields>
    <!-- Fields of type "string": ids, keys and metadata. -->
    <field name="ida"           type="string" stored="true" indexed="true" multiValued="false"/>
    <field name="solr_id"       type="string" stored="true" indexed="true" multiValued="false"/>
    <field name="model"         type="string" stored="true" indexed="true" multiValued="false"/>
    <field name="type"          type="string" stored="true" indexed="true"/>
    <field name="url"           type="string" stored="true" indexed="true"/>
    <field name="last_modified" type="string" stored="true" indexed="true"/>
    <field name="search_tag"    type="string" stored="true" indexed="true"/>

    <!-- Analyzed with the text_ktimatologio chain. -->
    <field name="title"      type="text_ktimatologio" stored="true" indexed="true"/>
    <field name="grid_title" type="text_ktimatologio" stored="true" indexed="true"/>
    <field name="content"    type="text_ktimatologio" stored="true" indexed="true" multiValued="true"/>

    <!-- Text extracted from binary attachments; analyzed with the "text" chain. -->
    <field name="contentbin" type="text" stored="true" indexed="true" multiValued="true"/>
  </fields>
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement