smartcloud 0.0.31

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (192) hide show
  1. checksums.yaml +7 -0
  2. data/MIT-LICENSE +21 -0
  3. data/README.md +79 -0
  4. data/bin/runner +20 -0
  5. data/bin/smartcloud +54 -0
  6. data/lib/smartcloud.rb +16 -0
  7. data/lib/smartcloud/boot.rb +93 -0
  8. data/lib/smartcloud/docker.rb +120 -0
  9. data/lib/smartcloud/grids/grid-mysql/docker-entrypoint-initdb.d/.keep +0 -0
  10. data/lib/smartcloud/grids/grid-nginx/fastcgi.conf +9 -0
  11. data/lib/smartcloud/grids/grid-nginx/nginx.tmpl +373 -0
  12. data/lib/smartcloud/grids/grid-runner/Dockerfile +27 -0
  13. data/lib/smartcloud/grids/grid-runner/buildpacks/rails/Dockerfile +30 -0
  14. data/lib/smartcloud/grids/grid-solr/docker-entrypoint-initdb.d/.keep +0 -0
  15. data/lib/smartcloud/grids/grid-solr/sunspot/conf/schema.xml +278 -0
  16. data/lib/smartcloud/grids/grid-solr/sunspot/conf/solrconfig.xml +632 -0
  17. data/lib/smartcloud/grids/mysql.rb +60 -0
  18. data/lib/smartcloud/grids/nginx.rb +133 -0
  19. data/lib/smartcloud/grids/runner.rb +373 -0
  20. data/lib/smartcloud/grids/solr.rb +92 -0
  21. data/lib/smartcloud/machine.rb +63 -0
  22. data/lib/smartcloud/templates/dotsmartcloud/config/environment.rb +13 -0
  23. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-mysql/data/.keep +0 -0
  24. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-nginx/certificates/.keep +0 -0
  25. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-nginx/htpasswd/.keep +0 -0
  26. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-nginx/users.yml +1 -0
  27. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-runner/apps/containers/.keep +0 -0
  28. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-runner/apps/repositories/.keep +0 -0
  29. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-runner/buildpacks/rails/gems/.keep +0 -0
  30. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-runner/pre-receive +13 -0
  31. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/.keep +0 -0
  32. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/README.txt +77 -0
  33. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/contractions_ca.txt +8 -0
  34. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/contractions_fr.txt +15 -0
  35. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/contractions_ga.txt +5 -0
  36. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/contractions_it.txt +23 -0
  37. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/hyphenations_ga.txt +5 -0
  38. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stemdict_nl.txt +6 -0
  39. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stoptags_ja.txt +420 -0
  40. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_ar.txt +125 -0
  41. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_bg.txt +193 -0
  42. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_ca.txt +220 -0
  43. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_cz.txt +172 -0
  44. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_da.txt +110 -0
  45. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_de.txt +294 -0
  46. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_el.txt +78 -0
  47. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_en.txt +54 -0
  48. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_es.txt +356 -0
  49. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_eu.txt +99 -0
  50. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_fa.txt +313 -0
  51. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_fi.txt +97 -0
  52. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_fr.txt +186 -0
  53. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_ga.txt +110 -0
  54. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_gl.txt +161 -0
  55. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_hi.txt +235 -0
  56. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_hu.txt +211 -0
  57. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_hy.txt +46 -0
  58. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_id.txt +359 -0
  59. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_it.txt +303 -0
  60. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_ja.txt +127 -0
  61. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_lv.txt +172 -0
  62. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_nl.txt +119 -0
  63. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_no.txt +194 -0
  64. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_pt.txt +253 -0
  65. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_ro.txt +233 -0
  66. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_ru.txt +243 -0
  67. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_sv.txt +133 -0
  68. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_th.txt +119 -0
  69. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/stopwords_tr.txt +212 -0
  70. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/lang/userdict_ja.txt +29 -0
  71. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/managed-schema +1007 -0
  72. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/params.json +20 -0
  73. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/protwords.txt +21 -0
  74. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/solrconfig.xml +1355 -0
  75. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/stopwords.txt +14 -0
  76. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/_default/conf/synonyms.txt +29 -0
  77. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/_rest_managed.json +1 -0
  78. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/_schema_analysis_stopwords_english.json +38 -0
  79. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/_schema_analysis_synonyms_english.json +11 -0
  80. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/clustering/carrot2/README.txt +11 -0
  81. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/clustering/carrot2/kmeans-attributes.xml +19 -0
  82. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/clustering/carrot2/lingo-attributes.xml +24 -0
  83. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/clustering/carrot2/stc-attributes.xml +19 -0
  84. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/currency.xml +67 -0
  85. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/elevate.xml +42 -0
  86. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/contractions_ca.txt +8 -0
  87. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/contractions_fr.txt +15 -0
  88. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/contractions_ga.txt +5 -0
  89. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/contractions_it.txt +23 -0
  90. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/hyphenations_ga.txt +5 -0
  91. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stemdict_nl.txt +6 -0
  92. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stoptags_ja.txt +420 -0
  93. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_ar.txt +125 -0
  94. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_bg.txt +193 -0
  95. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_ca.txt +220 -0
  96. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_ckb.txt +136 -0
  97. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_cz.txt +172 -0
  98. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_da.txt +110 -0
  99. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_de.txt +294 -0
  100. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_el.txt +78 -0
  101. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_en.txt +54 -0
  102. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_es.txt +356 -0
  103. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_eu.txt +99 -0
  104. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_fa.txt +313 -0
  105. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_fi.txt +97 -0
  106. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_fr.txt +186 -0
  107. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_ga.txt +110 -0
  108. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_gl.txt +161 -0
  109. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_hi.txt +235 -0
  110. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_hu.txt +211 -0
  111. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_hy.txt +46 -0
  112. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_id.txt +359 -0
  113. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_it.txt +303 -0
  114. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_ja.txt +127 -0
  115. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_lv.txt +172 -0
  116. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_nl.txt +119 -0
  117. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_no.txt +194 -0
  118. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_pt.txt +253 -0
  119. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_ro.txt +233 -0
  120. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_ru.txt +243 -0
  121. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_sv.txt +133 -0
  122. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_th.txt +119 -0
  123. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/stopwords_tr.txt +212 -0
  124. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/lang/userdict_ja.txt +29 -0
  125. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/managed-schema +1187 -0
  126. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/mapping-FoldToASCII.txt +3813 -0
  127. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/mapping-ISOLatin1Accent.txt +246 -0
  128. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/params.json +11 -0
  129. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/protwords.txt +21 -0
  130. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/solrconfig.xml +1616 -0
  131. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/spellings.txt +2 -0
  132. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/stopwords.txt +14 -0
  133. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/synonyms.txt +29 -0
  134. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/update-script.js +53 -0
  135. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/README.txt +101 -0
  136. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/VM_global_library.vm +186 -0
  137. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/browse.vm +33 -0
  138. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/cluster.vm +19 -0
  139. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/cluster_results.vm +31 -0
  140. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/debug.vm +28 -0
  141. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/did_you_mean.vm +11 -0
  142. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/error.vm +11 -0
  143. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/facet_fields.vm +24 -0
  144. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/facet_pivot.vm +12 -0
  145. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/facet_queries.vm +12 -0
  146. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/facet_ranges.vm +23 -0
  147. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/facets.vm +10 -0
  148. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/footer.vm +43 -0
  149. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/head.vm +37 -0
  150. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/header.vm +7 -0
  151. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/hit.vm +25 -0
  152. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/hit_grouped.vm +43 -0
  153. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/hit_plain.vm +25 -0
  154. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/join_doc.vm +20 -0
  155. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/jquery.autocomplete.css +48 -0
  156. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/jquery.autocomplete.js +763 -0
  157. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/layout.vm +24 -0
  158. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/main.css +231 -0
  159. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/mime_type_lists.vm +68 -0
  160. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/pagination_bottom.vm +22 -0
  161. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/pagination_top.vm +29 -0
  162. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/product_doc.vm +32 -0
  163. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/query.vm +42 -0
  164. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/query_form.vm +64 -0
  165. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/query_group.vm +43 -0
  166. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/query_spatial.vm +75 -0
  167. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/results_list.vm +22 -0
  168. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/richtext_doc.vm +153 -0
  169. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/suggest.vm +8 -0
  170. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/velocity/tabs.vm +50 -0
  171. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/xslt/example.xsl +132 -0
  172. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/xslt/example_atom.xsl +67 -0
  173. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/xslt/example_rss.xsl +66 -0
  174. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/xslt/luke.xsl +337 -0
  175. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sample_techproducts_configs/conf/xslt/updateXml.xsl +70 -0
  176. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sunspot/conf/_rest_managed.json +1 -0
  177. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sunspot/conf/admin-extra.html +31 -0
  178. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sunspot/conf/currency.xml +67 -0
  179. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sunspot/conf/elevate.xml +36 -0
  180. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sunspot/conf/lang/stopwords_en.txt +54 -0
  181. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sunspot/conf/mapping-ISOLatin1Accent.txt +246 -0
  182. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sunspot/conf/protwords.txt +21 -0
  183. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sunspot/conf/schema.xml +278 -0
  184. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sunspot/conf/scripts.conf +24 -0
  185. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sunspot/conf/solrconfig.xml +632 -0
  186. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sunspot/conf/spellings.txt +2 -0
  187. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/configsets/sunspot/conf/synonyms.txt +29 -0
  188. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/lib/.keep +0 -0
  189. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/solr.xml +53 -0
  190. data/lib/smartcloud/templates/dotsmartcloud/grids/grid-solr/data/zoo.cfg +31 -0
  191. data/lib/smartcloud/user.rb +72 -0
  192. metadata +237 -0
@@ -0,0 +1,212 @@
1
+ # Turkish stopwords from LUCENE-559
2
+ # merged with the list from "Information Retrieval on Turkish Texts"
3
+ # (http://www.users.muohio.edu/canf/papers/JASIST2008offPrint.pdf)
4
+ acaba
5
+ altmış
6
+ altı
7
+ ama
8
+ ancak
9
+ arada
10
+ aslında
11
+ ayrıca
12
+ bana
13
+ bazı
14
+ belki
15
+ ben
16
+ benden
17
+ beni
18
+ benim
19
+ beri
20
+ beş
21
+ bile
22
+ bin
23
+ bir
24
+ birçok
25
+ biri
26
+ birkaç
27
+ birkez
28
+ birşey
29
+ birşeyi
30
+ biz
31
+ bize
32
+ bizden
33
+ bizi
34
+ bizim
35
+ böyle
36
+ böylece
37
+ bu
38
+ buna
39
+ bunda
40
+ bundan
41
+ bunlar
42
+ bunları
43
+ bunların
44
+ bunu
45
+ bunun
46
+ burada
47
+ çok
48
+ çünkü
49
+ da
50
+ daha
51
+ dahi
52
+ de
53
+ defa
54
+ değil
55
+ diğer
56
+ diye
57
+ doksan
58
+ dokuz
59
+ dolayı
60
+ dolayısıyla
61
+ dört
62
+ edecek
63
+ eden
64
+ ederek
65
+ edilecek
66
+ ediliyor
67
+ edilmesi
68
+ ediyor
69
+ eğer
70
+ elli
71
+ en
72
+ etmesi
73
+ etti
74
+ ettiği
75
+ ettiğini
76
+ gibi
77
+ göre
78
+ halen
79
+ hangi
80
+ hatta
81
+ hem
82
+ henüz
83
+ hep
84
+ hepsi
85
+ her
86
+ herhangi
87
+ herkesin
88
+ hiç
89
+ hiçbir
90
+ için
91
+ iki
92
+ ile
93
+ ilgili
94
+ ise
95
+ işte
96
+ itibaren
97
+ itibariyle
98
+ kadar
99
+ karşın
100
+ katrilyon
101
+ kendi
102
+ kendilerine
103
+ kendini
104
+ kendisi
105
+ kendisine
106
+ kendisini
107
+ kez
108
+ ki
109
+ kim
110
+ kimden
111
+ kime
112
+ kimi
113
+ kimse
114
+ kırk
115
+ milyar
116
+ milyon
117
+ mu
118
+
119
+
120
+ nasıl
121
+ ne
122
+ neden
123
+ nedenle
124
+ nerde
125
+ nerede
126
+ nereye
127
+ niye
128
+ niçin
129
+ o
130
+ olan
131
+ olarak
132
+ oldu
133
+ olduğu
134
+ olduğunu
135
+ olduklarını
136
+ olmadı
137
+ olmadığı
138
+ olmak
139
+ olması
140
+ olmayan
141
+ olmaz
142
+ olsa
143
+ olsun
144
+ olup
145
+ olur
146
+ olursa
147
+ oluyor
148
+ on
149
+ ona
150
+ ondan
151
+ onlar
152
+ onlardan
153
+ onları
154
+ onların
155
+ onu
156
+ onun
157
+ otuz
158
+ oysa
159
+ öyle
160
+ pek
161
+ rağmen
162
+ sadece
163
+ sanki
164
+ sekiz
165
+ seksen
166
+ sen
167
+ senden
168
+ seni
169
+ senin
170
+ siz
171
+ sizden
172
+ sizi
173
+ sizin
174
+ şey
175
+ şeyden
176
+ şeyi
177
+ şeyler
178
+ şöyle
179
+ şu
180
+ şuna
181
+ şunda
182
+ şundan
183
+ şunları
184
+ şunu
185
+ tarafından
186
+ trilyon
187
+ tüm
188
+ üç
189
+ üzere
190
+ var
191
+ vardı
192
+ ve
193
+ veya
194
+ ya
195
+ yani
196
+ yapacak
197
+ yapılan
198
+ yapılması
199
+ yapıyor
200
+ yapmak
201
+ yaptı
202
+ yaptığı
203
+ yaptığını
204
+ yaptıkları
205
+ yedi
206
+ yerine
207
+ yetmiş
208
+ yine
209
+ yirmi
210
+ yoksa
211
+ yüz
212
+ zaten
@@ -0,0 +1,29 @@
1
+ #
2
+ # This is a sample user dictionary for Kuromoji (JapaneseTokenizer)
3
+ #
4
+ # Add entries to this file in order to override the statistical model in terms
5
+ # of segmentation, readings and part-of-speech tags. Notice that entries do
6
+ # not have weights since they are always used when found. This is by-design
7
+ # in order to maximize ease-of-use.
8
+ #
9
+ # Entries are defined using the following CSV format:
10
+ # <text>,<token 1> ... <token n>,<reading 1> ... <reading n>,<part-of-speech tag>
11
+ #
12
+ # Notice that a single half-width space separates tokens and readings, and
13
+ # that the number tokens and readings must match exactly.
14
+ #
15
+ # Also notice that multiple entries with the same <text> is undefined.
16
+ #
17
+ # Whitespace only lines are ignored. Comments are not allowed on entry lines.
18
+ #
19
+
20
+ # Custom segmentation for kanji compounds
21
+ 日本経済新聞,日本 経済 新聞,ニホン ケイザイ シンブン,カスタム名詞
22
+ 関西国際空港,関西 国際 空港,カンサイ コクサイ クウコウ,カスタム名詞
23
+
24
+ # Custom segmentation for compound katakana
25
+ トートバッグ,トート バッグ,トート バッグ,かずカナ名詞
26
+ ショルダーバッグ,ショルダー バッグ,ショルダー バッグ,かずカナ名詞
27
+
28
+ # Custom reading for former sumo wrestler
29
+ 朝青龍,朝青龍,アサショウリュウ,カスタム人名
@@ -0,0 +1,1007 @@
1
+ <?xml version="1.0" encoding="UTF-8" ?>
2
+ <!--
3
+ Licensed to the Apache Software Foundation (ASF) under one or more
4
+ contributor license agreements. See the NOTICE file distributed with
5
+ this work for additional information regarding copyright ownership.
6
+ The ASF licenses this file to You under the Apache License, Version 2.0
7
+ (the "License"); you may not use this file except in compliance with
8
+ the License. You may obtain a copy of the License at
9
+
10
+ http://www.apache.org/licenses/LICENSE-2.0
11
+
12
+ Unless required by applicable law or agreed to in writing, software
13
+ distributed under the License is distributed on an "AS IS" BASIS,
14
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15
+ See the License for the specific language governing permissions and
16
+ limitations under the License.
17
+ -->
18
+
19
+ <!--
20
+
21
+ This example schema is the recommended starting point for users.
22
+ It should be kept correct and concise, usable out-of-the-box.
23
+
24
+
25
+ For more information, on how to customize this file, please see
26
+ http://lucene.apache.org/solr/guide/documents-fields-and-schema-design.html
27
+
28
+ PERFORMANCE NOTE: this schema includes many optional features and should not
29
+ be used for benchmarking. To improve performance one could
30
+ - set stored="false" for all fields possible (esp large fields) when you
31
+ only need to search on the field but don't need to return the original
32
+ value.
33
+ - set indexed="false" if you don't need to search on the field, but only
34
+ return the field as a result of searching on other indexed fields.
35
+ - remove all unneeded copyField statements
36
+ - for best index size and searching performance, set "index" to false
37
+ for all general text fields, use copyField to copy them to the
38
+ catchall "text" field, and use that for searching.
39
+ -->
40
+
41
+ <schema name="default-config" version="1.6">
42
+ <!-- attribute "name" is the name of this schema and is only used for display purposes.
43
+ version="x.y" is Solr's version number for the schema syntax and
44
+ semantics. It should not normally be changed by applications.
45
+
46
+ 1.0: multiValued attribute did not exist, all fields are multiValued
47
+ by nature
48
+ 1.1: multiValued attribute introduced, false by default
49
+ 1.2: omitTermFreqAndPositions attribute introduced, true by default
50
+ except for text fields.
51
+ 1.3: removed optional field compress feature
52
+ 1.4: autoGeneratePhraseQueries attribute introduced to drive QueryParser
53
+ behavior when a single string produces multiple tokens. Defaults
54
+ to off for version >= 1.4
55
+ 1.5: omitNorms defaults to true for primitive field types
56
+ (int, float, boolean, string...)
57
+ 1.6: useDocValuesAsStored defaults to true.
58
+ -->
59
+
60
+ <!-- Valid attributes for fields:
61
+ name: mandatory - the name for the field
62
+ type: mandatory - the name of a field type from the
63
+ fieldTypes section
64
+ indexed: true if this field should be indexed (searchable or sortable)
65
+ stored: true if this field should be retrievable
66
+ docValues: true if this field should have doc values. Doc Values is
67
+ recommended (required, if you are using *Point fields) for faceting,
68
+ grouping, sorting and function queries. Doc Values will make the index
69
+ faster to load, more NRT-friendly and more memory-efficient.
70
+ They are currently only supported by StrField, UUIDField, all
71
+ *PointFields, and depending on the field type, they might require
72
+ the field to be single-valued, be required or have a default value
73
+ (check the documentation of the field type you're interested in for
74
+ more information)
75
+ multiValued: true if this field may contain multiple values per document
76
+ omitNorms: (expert) set to true to omit the norms associated with
77
+ this field (this disables length normalization and index-time
78
+ boosting for the field, and saves some memory). Only full-text
79
+ fields or fields that need an index-time boost need norms.
80
+ Norms are omitted for primitive (non-analyzed) types by default.
81
+ termVectors: [false] set to true to store the term vector for a
82
+ given field.
83
+ When using MoreLikeThis, fields used for similarity should be
84
+ stored for best performance.
85
+ termPositions: Store position information with the term vector.
86
+ This will increase storage costs.
87
+ termOffsets: Store offset information with the term vector. This
88
+ will increase storage costs.
89
+ required: The field is required. It will throw an error if the
90
+ value does not exist
91
+ default: a value that should be used if no value is specified
92
+ when adding a document.
93
+ -->
94
+
95
+ <!-- field names should consist of alphanumeric or underscore characters only and
96
+ not start with a digit. This is not currently strictly enforced,
97
+ but other field names will not have first class support from all components
98
+ and back compatibility is not guaranteed. Names with both leading and
99
+ trailing underscores (e.g. _version_) are reserved.
100
+ -->
101
+
102
+ <!-- In this _default configset, only four fields are pre-declared:
103
+ id, _version_, and _text_ and _root_. All other fields will be type guessed and added via the
104
+ "add-unknown-fields-to-the-schema" update request processor chain declared in solrconfig.xml.
105
+
106
+ Note that many dynamic fields are also defined - you can use them to specify a
107
+ field's type via field naming conventions - see below.
108
+
109
+ WARNING: The _text_ catch-all field will significantly increase your index size.
110
+ If you don't need it, consider removing it and the corresponding copyField directive.
111
+ -->
112
+
113
+ <field name="id" type="string" indexed="true" stored="true" required="true" multiValued="false" />
114
+ <!-- docValues are enabled by default for long type so we don't need to index the version field -->
115
+ <field name="_version_" type="plong" indexed="false" stored="false"/>
116
+ <field name="_root_" type="string" indexed="true" stored="false" docValues="false" />
117
+ <field name="_text_" type="text_general" indexed="true" stored="false" multiValued="true"/>
118
+
119
+ <!-- This can be enabled, in case the client does not know what fields may be searched. It isn't enabled by default
120
+ because it's very expensive to index everything twice. -->
121
+ <!-- <copyField source="*" dest="_text_"/> -->
122
+
123
+ <!-- Dynamic field definitions allow using convention over configuration
124
+ for fields via the specification of patterns to match field names.
125
+ EXAMPLE: name="*_i" will match any field ending in _i (like myid_i, z_i)
126
+ RESTRICTION: the glob-like pattern in the name attribute must have a "*" only at the start or the end. -->
127
+
128
+ <dynamicField name="*_i" type="pint" indexed="true" stored="true"/>
129
+ <dynamicField name="*_is" type="pints" indexed="true" stored="true"/>
130
+ <dynamicField name="*_s" type="string" indexed="true" stored="true" />
131
+ <dynamicField name="*_ss" type="strings" indexed="true" stored="true"/>
132
+ <dynamicField name="*_l" type="plong" indexed="true" stored="true"/>
133
+ <dynamicField name="*_ls" type="plongs" indexed="true" stored="true"/>
134
+ <dynamicField name="*_t" type="text_general" indexed="true" stored="true" multiValued="false"/>
135
+ <dynamicField name="*_txt" type="text_general" indexed="true" stored="true"/>
136
+ <dynamicField name="*_b" type="boolean" indexed="true" stored="true"/>
137
+ <dynamicField name="*_bs" type="booleans" indexed="true" stored="true"/>
138
+ <dynamicField name="*_f" type="pfloat" indexed="true" stored="true"/>
139
+ <dynamicField name="*_fs" type="pfloats" indexed="true" stored="true"/>
140
+ <dynamicField name="*_d" type="pdouble" indexed="true" stored="true"/>
141
+ <dynamicField name="*_ds" type="pdoubles" indexed="true" stored="true"/>
142
+ <dynamicField name="random_*" type="random"/>
143
+ <dynamicField name="ignored_*" type="ignored"/>
144
+
145
+ <!-- Type used for data-driven schema, to add a string copy for each text field -->
146
+ <dynamicField name="*_str" type="strings" stored="false" docValues="true" indexed="false" useDocValuesAsStored="false"/>
147
+
148
+ <dynamicField name="*_dt" type="pdate" indexed="true" stored="true"/>
149
+ <dynamicField name="*_dts" type="pdate" indexed="true" stored="true" multiValued="true"/>
150
+ <dynamicField name="*_p" type="location" indexed="true" stored="true"/>
151
+ <dynamicField name="*_srpt" type="location_rpt" indexed="true" stored="true"/>
152
+
153
+ <!-- payloaded dynamic fields -->
154
+ <dynamicField name="*_dpf" type="delimited_payloads_float" indexed="true" stored="true"/>
155
+ <dynamicField name="*_dpi" type="delimited_payloads_int" indexed="true" stored="true"/>
156
+ <dynamicField name="*_dps" type="delimited_payloads_string" indexed="true" stored="true"/>
157
+
158
+ <dynamicField name="attr_*" type="text_general" indexed="true" stored="true" multiValued="true"/>
159
+
160
+ <!-- Field to use to determine and enforce document uniqueness.
161
+ Unless this field is marked with required="false", it will be a required field
162
+ -->
163
+ <uniqueKey>id</uniqueKey>
164
+
165
+ <!-- copyField commands copy one field to another at the time a document
166
+ is added to the index. It's used either to index the same field differently,
167
+ or to add multiple fields to the same field for easier/faster searching.
168
+
169
+ <copyField source="sourceFieldName" dest="destinationFieldName"/>
170
+ -->
171
+
172
+ <!-- field type definitions. The "name" attribute is
173
+ just a label to be used by field definitions. The "class"
174
+ attribute and any other attributes determine the real
175
+ behavior of the fieldType.
176
+ Class names starting with "solr" refer to java classes in a
177
+ standard package such as org.apache.solr.analysis
178
+ -->
179
+
180
+ <!-- sortMissingLast and sortMissingFirst attributes are optional attributes are
181
+ currently supported on types that are sorted internally as strings
182
+ and on numeric types.
183
+ This includes "string", "boolean", "pint", "pfloat", "plong", "pdate", "pdouble".
184
+ - If sortMissingLast="true", then a sort on this field will cause documents
185
+ without the field to come after documents with the field,
186
+ regardless of the requested sort order (asc or desc).
187
+ - If sortMissingFirst="true", then a sort on this field will cause documents
188
+ without the field to come before documents with the field,
189
+ regardless of the requested sort order.
190
+ - If sortMissingLast="false" and sortMissingFirst="false" (the default),
191
+ then default lucene sorting will be used which places docs without the
192
+ field first in an ascending sort and last in a descending sort.
193
+ -->
194
+
195
+ <!-- The StrField type is not analyzed, but indexed/stored verbatim. -->
196
+ <fieldType name="string" class="solr.StrField" sortMissingLast="true" docValues="true" />
197
+ <fieldType name="strings" class="solr.StrField" sortMissingLast="true" multiValued="true" docValues="true" />
198
+
199
+ <!-- boolean type: "true" or "false" -->
200
+ <fieldType name="boolean" class="solr.BoolField" sortMissingLast="true"/>
201
+ <fieldType name="booleans" class="solr.BoolField" sortMissingLast="true" multiValued="true"/>
202
+
203
+ <!--
204
+ Numeric field types that index values using KD-trees.
205
+ Point fields don't support FieldCache, so they must have docValues="true" if needed for sorting, faceting, functions, etc.
206
+ -->
207
+ <fieldType name="pint" class="solr.IntPointField" docValues="true"/>
208
+ <fieldType name="pfloat" class="solr.FloatPointField" docValues="true"/>
209
+ <fieldType name="plong" class="solr.LongPointField" docValues="true"/>
210
+ <fieldType name="pdouble" class="solr.DoublePointField" docValues="true"/>
211
+
212
+ <fieldType name="pints" class="solr.IntPointField" docValues="true" multiValued="true"/>
213
+ <fieldType name="pfloats" class="solr.FloatPointField" docValues="true" multiValued="true"/>
214
+ <fieldType name="plongs" class="solr.LongPointField" docValues="true" multiValued="true"/>
215
+ <fieldType name="pdoubles" class="solr.DoublePointField" docValues="true" multiValued="true"/>
216
+ <fieldType name="random" class="solr.RandomSortField" indexed="true"/>
217
+
218
+ <!-- since fields of this type are by default not stored or indexed,
219
+ any data added to them will be ignored outright. -->
220
+ <fieldType name="ignored" stored="false" indexed="false" multiValued="true" class="solr.StrField" />
221
+
222
+ <!-- The format for this date field is of the form 1995-12-31T23:59:59Z, and
223
+ is a more restricted form of the canonical representation of dateTime
224
+ http://www.w3.org/TR/xmlschema-2/#dateTime
225
+ The trailing "Z" designates UTC time and is mandatory.
226
+ Optional fractional seconds are allowed: 1995-12-31T23:59:59.999Z
227
+ All other components are mandatory.
228
+
229
+ Expressions can also be used to denote calculations that should be
230
+ performed relative to "NOW" to determine the value, ie...
231
+
232
+ NOW/HOUR
233
+ ... Round to the start of the current hour
234
+ NOW-1DAY
235
+ ... Exactly 1 day prior to now
236
+ NOW/DAY+6MONTHS+3DAYS
237
+ ... 6 months and 3 days in the future from the start of
238
+ the current day
239
+
240
+ -->
241
+ <!-- KD-tree versions of date fields -->
242
+ <fieldType name="pdate" class="solr.DatePointField" docValues="true"/>
243
+ <fieldType name="pdates" class="solr.DatePointField" docValues="true" multiValued="true"/>
244
+
245
+ <!--Binary data type. The data should be sent/retrieved in as Base64 encoded Strings -->
246
+ <fieldType name="binary" class="solr.BinaryField"/>
247
+
248
+ <!-- solr.TextField allows the specification of custom text analyzers
249
+ specified as a tokenizer and a list of token filters. Different
250
+ analyzers may be specified for indexing and querying.
251
+
252
+ The optional positionIncrementGap puts space between multiple fields of
253
+ this type on the same document, with the purpose of preventing false phrase
254
+ matching across fields.
255
+
256
+ For more info on customizing your analyzer chain, please see
257
+ http://lucene.apache.org/solr/guide/understanding-analyzers-tokenizers-and-filters.html#understanding-analyzers-tokenizers-and-filters
258
+ -->
259
+
260
+ <!-- One can also specify an existing Analyzer class that has a
261
+ default constructor via the class attribute on the analyzer element.
262
+ Example:
263
+ <fieldType name="text_greek" class="solr.TextField">
264
+ <analyzer class="org.apache.lucene.analysis.el.GreekAnalyzer"/>
265
+ </fieldType>
266
+ -->
267
+
268
+ <!-- A text field that only splits on whitespace for exact matching of words -->
269
+ <dynamicField name="*_ws" type="text_ws" indexed="true" stored="true"/>
270
+ <fieldType name="text_ws" class="solr.TextField" positionIncrementGap="100">
271
+ <analyzer>
272
+ <tokenizer class="solr.WhitespaceTokenizerFactory"/>
273
+ </analyzer>
274
+ </fieldType>
275
+
276
+ <!-- A general text field that has reasonable, generic
277
+ cross-language defaults: it tokenizes with StandardTokenizer,
278
+ removes stop words from case-insensitive "stopwords.txt"
279
+ (empty by default), and down cases. At query time only, it
280
+ also applies synonyms.
281
+ -->
282
+ <fieldType name="text_general" class="solr.TextField" positionIncrementGap="100" multiValued="true">
283
+ <analyzer type="index">
284
+ <tokenizer class="solr.StandardTokenizerFactory"/>
285
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="stopwords.txt" />
286
+ <!-- in this example, we will only use synonyms at query time
287
+ <filter class="solr.SynonymGraphFilterFactory" synonyms="index_synonyms.txt" ignoreCase="true" expand="false"/>
288
+ <filter class="solr.FlattenGraphFilterFactory"/>
289
+ -->
290
+ <filter class="solr.LowerCaseFilterFactory"/>
291
+ </analyzer>
292
+ <analyzer type="query">
293
+ <tokenizer class="solr.StandardTokenizerFactory"/>
294
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="stopwords.txt" />
295
+ <filter class="solr.SynonymGraphFilterFactory" synonyms="synonyms.txt" ignoreCase="true" expand="true"/>
296
+ <filter class="solr.LowerCaseFilterFactory"/>
297
+ </analyzer>
298
+ </fieldType>
299
+
300
+
301
+ <!-- SortableTextField generaly functions exactly like TextField,
302
+ except that it supports, and by default uses, docValues for sorting (or faceting)
303
+ on the first 1024 characters of the original field values (which is configurable).
304
+
305
+ This makes it a bit more useful then TextField in many situations, but the trade-off
306
+ is that it takes up more space on disk; which is why it's not used in place of TextField
307
+ for every fieldType in this _default schema.
308
+ -->
309
+ <dynamicField name="*_t_sort" type="text_gen_sort" indexed="true" stored="true" multiValued="false"/>
310
+ <dynamicField name="*_txt_sort" type="text_gen_sort" indexed="true" stored="true"/>
311
+ <fieldType name="text_gen_sort" class="solr.SortableTextField" positionIncrementGap="100" multiValued="true">
312
+ <analyzer type="index">
313
+ <tokenizer class="solr.StandardTokenizerFactory"/>
314
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="stopwords.txt" />
315
+ <filter class="solr.LowerCaseFilterFactory"/>
316
+ </analyzer>
317
+ <analyzer type="query">
318
+ <tokenizer class="solr.StandardTokenizerFactory"/>
319
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="stopwords.txt" />
320
+ <filter class="solr.SynonymGraphFilterFactory" synonyms="synonyms.txt" ignoreCase="true" expand="true"/>
321
+ <filter class="solr.LowerCaseFilterFactory"/>
322
+ </analyzer>
323
+ </fieldType>
324
+
325
+ <!-- A text field with defaults appropriate for English: it tokenizes with StandardTokenizer,
326
+ removes English stop words (lang/stopwords_en.txt), down cases, protects words from protwords.txt, and
327
+ finally applies Porter's stemming. The query time analyzer also applies synonyms from synonyms.txt. -->
328
+ <dynamicField name="*_txt_en" type="text_en" indexed="true" stored="true"/>
329
+ <fieldType name="text_en" class="solr.TextField" positionIncrementGap="100">
330
+ <analyzer type="index">
331
+ <tokenizer class="solr.StandardTokenizerFactory"/>
332
+ <!-- in this example, we will only use synonyms at query time
333
+ <filter class="solr.SynonymGraphFilterFactory" synonyms="index_synonyms.txt" ignoreCase="true" expand="false"/>
334
+ <filter class="solr.FlattenGraphFilterFactory"/>
335
+ -->
336
+ <!-- Case insensitive stop word removal.
337
+ -->
338
+ <filter class="solr.StopFilterFactory"
339
+ ignoreCase="true"
340
+ words="lang/stopwords_en.txt"
341
+ />
342
+ <filter class="solr.LowerCaseFilterFactory"/>
343
+ <filter class="solr.EnglishPossessiveFilterFactory"/>
344
+ <filter class="solr.KeywordMarkerFilterFactory" protected="protwords.txt"/>
345
+ <!-- Optionally you may want to use this less aggressive stemmer instead of PorterStemFilterFactory:
346
+ <filter class="solr.EnglishMinimalStemFilterFactory"/>
347
+ -->
348
+ <filter class="solr.PorterStemFilterFactory"/>
349
+ </analyzer>
350
+ <analyzer type="query">
351
+ <tokenizer class="solr.StandardTokenizerFactory"/>
352
+ <filter class="solr.SynonymGraphFilterFactory" synonyms="synonyms.txt" ignoreCase="true" expand="true"/>
353
+ <filter class="solr.StopFilterFactory"
354
+ ignoreCase="true"
355
+ words="lang/stopwords_en.txt"
356
+ />
357
+ <filter class="solr.LowerCaseFilterFactory"/>
358
+ <filter class="solr.EnglishPossessiveFilterFactory"/>
359
+ <filter class="solr.KeywordMarkerFilterFactory" protected="protwords.txt"/>
360
+ <!-- Optionally you may want to use this less aggressive stemmer instead of PorterStemFilterFactory:
361
+ <filter class="solr.EnglishMinimalStemFilterFactory"/>
362
+ -->
363
+ <filter class="solr.PorterStemFilterFactory"/>
364
+ </analyzer>
365
+ </fieldType>
366
+
367
+ <!-- A text field with defaults appropriate for English, plus
368
+ aggressive word-splitting and autophrase features enabled.
369
+ This field is just like text_en, except it adds
370
+ WordDelimiterGraphFilter to enable splitting and matching of
371
+ words on case-change, alpha numeric boundaries, and
372
+ non-alphanumeric chars. This means certain compound word
373
+ cases will work, for example query "wi fi" will match
374
+ document "WiFi" or "wi-fi".
375
+ -->
376
+ <dynamicField name="*_txt_en_split" type="text_en_splitting" indexed="true" stored="true"/>
377
+ <fieldType name="text_en_splitting" class="solr.TextField" positionIncrementGap="100" autoGeneratePhraseQueries="true">
378
+ <analyzer type="index">
379
+ <tokenizer class="solr.WhitespaceTokenizerFactory"/>
380
+ <!-- in this example, we will only use synonyms at query time
381
+ <filter class="solr.SynonymGraphFilterFactory" synonyms="index_synonyms.txt" ignoreCase="true" expand="false"/>
382
+ -->
383
+ <!-- Case insensitive stop word removal.
384
+ -->
385
+ <filter class="solr.StopFilterFactory"
386
+ ignoreCase="true"
387
+ words="lang/stopwords_en.txt"
388
+ />
389
+ <filter class="solr.WordDelimiterGraphFilterFactory" generateWordParts="1" generateNumberParts="1" catenateWords="1" catenateNumbers="1" catenateAll="0" splitOnCaseChange="1"/>
390
+ <filter class="solr.LowerCaseFilterFactory"/>
391
+ <filter class="solr.KeywordMarkerFilterFactory" protected="protwords.txt"/>
392
+ <filter class="solr.PorterStemFilterFactory"/>
393
+ <filter class="solr.FlattenGraphFilterFactory" />
394
+ </analyzer>
395
+ <analyzer type="query">
396
+ <tokenizer class="solr.WhitespaceTokenizerFactory"/>
397
+ <filter class="solr.SynonymGraphFilterFactory" synonyms="synonyms.txt" ignoreCase="true" expand="true"/>
398
+ <filter class="solr.StopFilterFactory"
399
+ ignoreCase="true"
400
+ words="lang/stopwords_en.txt"
401
+ />
402
+ <filter class="solr.WordDelimiterGraphFilterFactory" generateWordParts="1" generateNumberParts="1" catenateWords="0" catenateNumbers="0" catenateAll="0" splitOnCaseChange="1"/>
403
+ <filter class="solr.LowerCaseFilterFactory"/>
404
+ <filter class="solr.KeywordMarkerFilterFactory" protected="protwords.txt"/>
405
+ <filter class="solr.PorterStemFilterFactory"/>
406
+ </analyzer>
407
+ </fieldType>
408
+
409
+ <!-- Less flexible matching, but less false matches. Probably not ideal for product names,
410
+ but may be good for SKUs. Can insert dashes in the wrong place and still match. -->
411
+ <dynamicField name="*_txt_en_split_tight" type="text_en_splitting_tight" indexed="true" stored="true"/>
412
+ <fieldType name="text_en_splitting_tight" class="solr.TextField" positionIncrementGap="100" autoGeneratePhraseQueries="true">
413
+ <analyzer type="index">
414
+ <tokenizer class="solr.WhitespaceTokenizerFactory"/>
415
+ <filter class="solr.SynonymGraphFilterFactory" synonyms="synonyms.txt" ignoreCase="true" expand="false"/>
416
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_en.txt"/>
417
+ <filter class="solr.WordDelimiterGraphFilterFactory" generateWordParts="0" generateNumberParts="0" catenateWords="1" catenateNumbers="1" catenateAll="0"/>
418
+ <filter class="solr.LowerCaseFilterFactory"/>
419
+ <filter class="solr.KeywordMarkerFilterFactory" protected="protwords.txt"/>
420
+ <filter class="solr.EnglishMinimalStemFilterFactory"/>
421
+ <!-- this filter can remove any duplicate tokens that appear at the same position - sometimes
422
+ possible with WordDelimiterGraphFilter in conjuncton with stemming. -->
423
+ <filter class="solr.RemoveDuplicatesTokenFilterFactory"/>
424
+ <filter class="solr.FlattenGraphFilterFactory" />
425
+ </analyzer>
426
+ <analyzer type="query">
427
+ <tokenizer class="solr.WhitespaceTokenizerFactory"/>
428
+ <filter class="solr.SynonymGraphFilterFactory" synonyms="synonyms.txt" ignoreCase="true" expand="false"/>
429
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_en.txt"/>
430
+ <filter class="solr.WordDelimiterGraphFilterFactory" generateWordParts="0" generateNumberParts="0" catenateWords="1" catenateNumbers="1" catenateAll="0"/>
431
+ <filter class="solr.LowerCaseFilterFactory"/>
432
+ <filter class="solr.KeywordMarkerFilterFactory" protected="protwords.txt"/>
433
+ <filter class="solr.EnglishMinimalStemFilterFactory"/>
434
+ <!-- this filter can remove any duplicate tokens that appear at the same position - sometimes
435
+ possible with WordDelimiterGraphFilter in conjuncton with stemming. -->
436
+ <filter class="solr.RemoveDuplicatesTokenFilterFactory"/>
437
+ </analyzer>
438
+ </fieldType>
439
+
440
+ <!-- Just like text_general except it reverses the characters of
441
+ each token, to enable more efficient leading wildcard queries.
442
+ -->
443
+ <dynamicField name="*_txt_rev" type="text_general_rev" indexed="true" stored="true"/>
444
+ <fieldType name="text_general_rev" class="solr.TextField" positionIncrementGap="100">
445
+ <analyzer type="index">
446
+ <tokenizer class="solr.StandardTokenizerFactory"/>
447
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="stopwords.txt" />
448
+ <filter class="solr.LowerCaseFilterFactory"/>
449
+ <filter class="solr.ReversedWildcardFilterFactory" withOriginal="true"
450
+ maxPosAsterisk="3" maxPosQuestion="2" maxFractionAsterisk="0.33"/>
451
+ </analyzer>
452
+ <analyzer type="query">
453
+ <tokenizer class="solr.StandardTokenizerFactory"/>
454
+ <filter class="solr.SynonymGraphFilterFactory" synonyms="synonyms.txt" ignoreCase="true" expand="true"/>
455
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="stopwords.txt" />
456
+ <filter class="solr.LowerCaseFilterFactory"/>
457
+ </analyzer>
458
+ </fieldType>
459
+
460
+ <dynamicField name="*_phon_en" type="phonetic_en" indexed="true" stored="true"/>
461
+ <fieldType name="phonetic_en" stored="false" indexed="true" class="solr.TextField" >
462
+ <analyzer>
463
+ <tokenizer class="solr.StandardTokenizerFactory"/>
464
+ <filter class="solr.DoubleMetaphoneFilterFactory" inject="false"/>
465
+ </analyzer>
466
+ </fieldType>
467
+
468
+ <!-- lowercases the entire field value, keeping it as a single token. -->
469
+ <dynamicField name="*_s_lower" type="lowercase" indexed="true" stored="true"/>
470
+ <fieldType name="lowercase" class="solr.TextField" positionIncrementGap="100">
471
+ <analyzer>
472
+ <tokenizer class="solr.KeywordTokenizerFactory"/>
473
+ <filter class="solr.LowerCaseFilterFactory" />
474
+ </analyzer>
475
+ </fieldType>
476
+
477
+ <!--
478
+ Example of using PathHierarchyTokenizerFactory at index time, so
479
+ queries for paths match documents at that path, or in descendent paths
480
+ -->
481
+ <dynamicField name="*_descendent_path" type="descendent_path" indexed="true" stored="true"/>
482
+ <fieldType name="descendent_path" class="solr.TextField">
483
+ <analyzer type="index">
484
+ <tokenizer class="solr.PathHierarchyTokenizerFactory" delimiter="/" />
485
+ </analyzer>
486
+ <analyzer type="query">
487
+ <tokenizer class="solr.KeywordTokenizerFactory" />
488
+ </analyzer>
489
+ </fieldType>
490
+
491
+ <!--
492
+ Example of using PathHierarchyTokenizerFactory at query time, so
493
+ queries for paths match documents at that path, or in ancestor paths
494
+ -->
495
+ <dynamicField name="*_ancestor_path" type="ancestor_path" indexed="true" stored="true"/>
496
+ <fieldType name="ancestor_path" class="solr.TextField">
497
+ <analyzer type="index">
498
+ <tokenizer class="solr.KeywordTokenizerFactory" />
499
+ </analyzer>
500
+ <analyzer type="query">
501
+ <tokenizer class="solr.PathHierarchyTokenizerFactory" delimiter="/" />
502
+ </analyzer>
503
+ </fieldType>
504
+
505
+ <!-- This point type indexes the coordinates as separate fields (subFields)
506
+ If subFieldType is defined, it references a type, and a dynamic field
507
+ definition is created matching *___<typename>. Alternately, if
508
+ subFieldSuffix is defined, that is used to create the subFields.
509
+ Example: if subFieldType="double", then the coordinates would be
510
+ indexed in fields myloc_0___double,myloc_1___double.
511
+ Example: if subFieldSuffix="_d" then the coordinates would be indexed
512
+ in fields myloc_0_d,myloc_1_d
513
+ The subFields are an implementation detail of the fieldType, and end
514
+ users normally should not need to know about them.
515
+ -->
516
+ <dynamicField name="*_point" type="point" indexed="true" stored="true"/>
517
+ <fieldType name="point" class="solr.PointType" dimension="2" subFieldSuffix="_d"/>
518
+
519
+ <!-- A specialized field for geospatial search filters and distance sorting. -->
520
+ <fieldType name="location" class="solr.LatLonPointSpatialField" docValues="true"/>
521
+
522
+ <!-- A geospatial field type that supports multiValued and polygon shapes.
523
+ For more information about this and other spatial fields see:
524
+ http://lucene.apache.org/solr/guide/spatial-search.html
525
+ -->
526
+ <fieldType name="location_rpt" class="solr.SpatialRecursivePrefixTreeFieldType"
527
+ geo="true" distErrPct="0.025" maxDistErr="0.001" distanceUnits="kilometers" />
528
+
529
+ <!-- Payloaded field types -->
530
+ <fieldType name="delimited_payloads_float" stored="false" indexed="true" class="solr.TextField">
531
+ <analyzer>
532
+ <tokenizer class="solr.WhitespaceTokenizerFactory"/>
533
+ <filter class="solr.DelimitedPayloadTokenFilterFactory" encoder="float"/>
534
+ </analyzer>
535
+ </fieldType>
536
+ <fieldType name="delimited_payloads_int" stored="false" indexed="true" class="solr.TextField">
537
+ <analyzer>
538
+ <tokenizer class="solr.WhitespaceTokenizerFactory"/>
539
+ <filter class="solr.DelimitedPayloadTokenFilterFactory" encoder="integer"/>
540
+ </analyzer>
541
+ </fieldType>
542
+ <fieldType name="delimited_payloads_string" stored="false" indexed="true" class="solr.TextField">
543
+ <analyzer>
544
+ <tokenizer class="solr.WhitespaceTokenizerFactory"/>
545
+ <filter class="solr.DelimitedPayloadTokenFilterFactory" encoder="identity"/>
546
+ </analyzer>
547
+ </fieldType>
548
+
549
+ <!-- some examples for different languages (generally ordered by ISO code) -->
550
+
551
+ <!-- Arabic -->
552
+ <dynamicField name="*_txt_ar" type="text_ar" indexed="true" stored="true"/>
553
+ <fieldType name="text_ar" class="solr.TextField" positionIncrementGap="100">
554
+ <analyzer>
555
+ <tokenizer class="solr.StandardTokenizerFactory"/>
556
+ <!-- for any non-arabic -->
557
+ <filter class="solr.LowerCaseFilterFactory"/>
558
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_ar.txt" />
559
+ <!-- normalizes ﻯ to ﻱ, etc -->
560
+ <filter class="solr.ArabicNormalizationFilterFactory"/>
561
+ <filter class="solr.ArabicStemFilterFactory"/>
562
+ </analyzer>
563
+ </fieldType>
564
+
565
+ <!-- Bulgarian -->
566
+ <dynamicField name="*_txt_bg" type="text_bg" indexed="true" stored="true"/>
567
+ <fieldType name="text_bg" class="solr.TextField" positionIncrementGap="100">
568
+ <analyzer>
569
+ <tokenizer class="solr.StandardTokenizerFactory"/>
570
+ <filter class="solr.LowerCaseFilterFactory"/>
571
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_bg.txt" />
572
+ <filter class="solr.BulgarianStemFilterFactory"/>
573
+ </analyzer>
574
+ </fieldType>
575
+
576
+ <!-- Catalan -->
577
+ <dynamicField name="*_txt_ca" type="text_ca" indexed="true" stored="true"/>
578
+ <fieldType name="text_ca" class="solr.TextField" positionIncrementGap="100">
579
+ <analyzer>
580
+ <tokenizer class="solr.StandardTokenizerFactory"/>
581
+ <!-- removes l', etc -->
582
+ <filter class="solr.ElisionFilterFactory" ignoreCase="true" articles="lang/contractions_ca.txt"/>
583
+ <filter class="solr.LowerCaseFilterFactory"/>
584
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_ca.txt" />
585
+ <filter class="solr.SnowballPorterFilterFactory" language="Catalan"/>
586
+ </analyzer>
587
+ </fieldType>
588
+
589
+ <!-- CJK bigram (see text_ja for a Japanese configuration using morphological analysis) -->
590
+ <dynamicField name="*_txt_cjk" type="text_cjk" indexed="true" stored="true"/>
591
+ <fieldType name="text_cjk" class="solr.TextField" positionIncrementGap="100">
592
+ <analyzer>
593
+ <tokenizer class="solr.StandardTokenizerFactory"/>
594
+ <!-- normalize width before bigram, as e.g. half-width dakuten combine -->
595
+ <filter class="solr.CJKWidthFilterFactory"/>
596
+ <!-- for any non-CJK -->
597
+ <filter class="solr.LowerCaseFilterFactory"/>
598
+ <filter class="solr.CJKBigramFilterFactory"/>
599
+ </analyzer>
600
+ </fieldType>
601
+
602
+ <!-- Czech -->
603
+ <dynamicField name="*_txt_cz" type="text_cz" indexed="true" stored="true"/>
604
+ <fieldType name="text_cz" class="solr.TextField" positionIncrementGap="100">
605
+ <analyzer>
606
+ <tokenizer class="solr.StandardTokenizerFactory"/>
607
+ <filter class="solr.LowerCaseFilterFactory"/>
608
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_cz.txt" />
609
+ <filter class="solr.CzechStemFilterFactory"/>
610
+ </analyzer>
611
+ </fieldType>
612
+
613
+ <!-- Danish -->
614
+ <dynamicField name="*_txt_da" type="text_da" indexed="true" stored="true"/>
615
+ <fieldType name="text_da" class="solr.TextField" positionIncrementGap="100">
616
+ <analyzer>
617
+ <tokenizer class="solr.StandardTokenizerFactory"/>
618
+ <filter class="solr.LowerCaseFilterFactory"/>
619
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_da.txt" format="snowball" />
620
+ <filter class="solr.SnowballPorterFilterFactory" language="Danish"/>
621
+ </analyzer>
622
+ </fieldType>
623
+
624
+ <!-- German -->
625
+ <dynamicField name="*_txt_de" type="text_de" indexed="true" stored="true"/>
626
+ <fieldType name="text_de" class="solr.TextField" positionIncrementGap="100">
627
+ <analyzer>
628
+ <tokenizer class="solr.StandardTokenizerFactory"/>
629
+ <filter class="solr.LowerCaseFilterFactory"/>
630
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_de.txt" format="snowball" />
631
+ <filter class="solr.GermanNormalizationFilterFactory"/>
632
+ <filter class="solr.GermanLightStemFilterFactory"/>
633
+ <!-- less aggressive: <filter class="solr.GermanMinimalStemFilterFactory"/> -->
634
+ <!-- more aggressive: <filter class="solr.SnowballPorterFilterFactory" language="German2"/> -->
635
+ </analyzer>
636
+ </fieldType>
637
+
638
+ <!-- Greek -->
639
+ <dynamicField name="*_txt_el" type="text_el" indexed="true" stored="true"/>
640
+ <fieldType name="text_el" class="solr.TextField" positionIncrementGap="100">
641
+ <analyzer>
642
+ <tokenizer class="solr.StandardTokenizerFactory"/>
643
+ <!-- greek specific lowercase for sigma -->
644
+ <filter class="solr.GreekLowerCaseFilterFactory"/>
645
+ <filter class="solr.StopFilterFactory" ignoreCase="false" words="lang/stopwords_el.txt" />
646
+ <filter class="solr.GreekStemFilterFactory"/>
647
+ </analyzer>
648
+ </fieldType>
649
+
650
+ <!-- Spanish -->
651
+ <dynamicField name="*_txt_es" type="text_es" indexed="true" stored="true"/>
652
+ <fieldType name="text_es" class="solr.TextField" positionIncrementGap="100">
653
+ <analyzer>
654
+ <tokenizer class="solr.StandardTokenizerFactory"/>
655
+ <filter class="solr.LowerCaseFilterFactory"/>
656
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_es.txt" format="snowball" />
657
+ <filter class="solr.SpanishLightStemFilterFactory"/>
658
+ <!-- more aggressive: <filter class="solr.SnowballPorterFilterFactory" language="Spanish"/> -->
659
+ </analyzer>
660
+ </fieldType>
661
+
662
+ <!-- Basque -->
663
+ <dynamicField name="*_txt_eu" type="text_eu" indexed="true" stored="true"/>
664
+ <fieldType name="text_eu" class="solr.TextField" positionIncrementGap="100">
665
+ <analyzer>
666
+ <tokenizer class="solr.StandardTokenizerFactory"/>
667
+ <filter class="solr.LowerCaseFilterFactory"/>
668
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_eu.txt" />
669
+ <filter class="solr.SnowballPorterFilterFactory" language="Basque"/>
670
+ </analyzer>
671
+ </fieldType>
672
+
673
+ <!-- Persian -->
674
+ <dynamicField name="*_txt_fa" type="text_fa" indexed="true" stored="true"/>
675
+ <fieldType name="text_fa" class="solr.TextField" positionIncrementGap="100">
676
+ <analyzer>
677
+ <!-- for ZWNJ -->
678
+ <charFilter class="solr.PersianCharFilterFactory"/>
679
+ <tokenizer class="solr.StandardTokenizerFactory"/>
680
+ <filter class="solr.LowerCaseFilterFactory"/>
681
+ <filter class="solr.ArabicNormalizationFilterFactory"/>
682
+ <filter class="solr.PersianNormalizationFilterFactory"/>
683
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_fa.txt" />
684
+ </analyzer>
685
+ </fieldType>
686
+
687
+ <!-- Finnish -->
688
+ <dynamicField name="*_txt_fi" type="text_fi" indexed="true" stored="true"/>
689
+ <fieldType name="text_fi" class="solr.TextField" positionIncrementGap="100">
690
+ <analyzer>
691
+ <tokenizer class="solr.StandardTokenizerFactory"/>
692
+ <filter class="solr.LowerCaseFilterFactory"/>
693
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_fi.txt" format="snowball" />
694
+ <filter class="solr.SnowballPorterFilterFactory" language="Finnish"/>
695
+ <!-- less aggressive: <filter class="solr.FinnishLightStemFilterFactory"/> -->
696
+ </analyzer>
697
+ </fieldType>
698
+
699
+ <!-- French -->
700
+ <dynamicField name="*_txt_fr" type="text_fr" indexed="true" stored="true"/>
701
+ <fieldType name="text_fr" class="solr.TextField" positionIncrementGap="100">
702
+ <analyzer>
703
+ <tokenizer class="solr.StandardTokenizerFactory"/>
704
+ <!-- removes l', etc -->
705
+ <filter class="solr.ElisionFilterFactory" ignoreCase="true" articles="lang/contractions_fr.txt"/>
706
+ <filter class="solr.LowerCaseFilterFactory"/>
707
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_fr.txt" format="snowball" />
708
+ <filter class="solr.FrenchLightStemFilterFactory"/>
709
+ <!-- less aggressive: <filter class="solr.FrenchMinimalStemFilterFactory"/> -->
710
+ <!-- more aggressive: <filter class="solr.SnowballPorterFilterFactory" language="French"/> -->
711
+ </analyzer>
712
+ </fieldType>
713
+
714
+ <!-- Irish -->
715
+ <dynamicField name="*_txt_ga" type="text_ga" indexed="true" stored="true"/>
716
+ <fieldType name="text_ga" class="solr.TextField" positionIncrementGap="100">
717
+ <analyzer>
718
+ <tokenizer class="solr.StandardTokenizerFactory"/>
719
+ <!-- removes d', etc -->
720
+ <filter class="solr.ElisionFilterFactory" ignoreCase="true" articles="lang/contractions_ga.txt"/>
721
+ <!-- removes n-, etc. position increments is intentionally false! -->
722
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/hyphenations_ga.txt"/>
723
+ <filter class="solr.IrishLowerCaseFilterFactory"/>
724
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_ga.txt"/>
725
+ <filter class="solr.SnowballPorterFilterFactory" language="Irish"/>
726
+ </analyzer>
727
+ </fieldType>
728
+
729
+ <!-- Galician -->
730
+ <dynamicField name="*_txt_gl" type="text_gl" indexed="true" stored="true"/>
731
+ <fieldType name="text_gl" class="solr.TextField" positionIncrementGap="100">
732
+ <analyzer>
733
+ <tokenizer class="solr.StandardTokenizerFactory"/>
734
+ <filter class="solr.LowerCaseFilterFactory"/>
735
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_gl.txt" />
736
+ <filter class="solr.GalicianStemFilterFactory"/>
737
+ <!-- less aggressive: <filter class="solr.GalicianMinimalStemFilterFactory"/> -->
738
+ </analyzer>
739
+ </fieldType>
740
+
741
+ <!-- Hindi -->
742
+ <dynamicField name="*_txt_hi" type="text_hi" indexed="true" stored="true"/>
743
+ <fieldType name="text_hi" class="solr.TextField" positionIncrementGap="100">
744
+ <analyzer>
745
+ <tokenizer class="solr.StandardTokenizerFactory"/>
746
+ <filter class="solr.LowerCaseFilterFactory"/>
747
+ <!-- normalizes unicode representation -->
748
+ <filter class="solr.IndicNormalizationFilterFactory"/>
749
+ <!-- normalizes variation in spelling -->
750
+ <filter class="solr.HindiNormalizationFilterFactory"/>
751
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_hi.txt" />
752
+ <filter class="solr.HindiStemFilterFactory"/>
753
+ </analyzer>
754
+ </fieldType>
755
+
756
+ <!-- Hungarian -->
757
+ <dynamicField name="*_txt_hu" type="text_hu" indexed="true" stored="true"/>
758
+ <fieldType name="text_hu" class="solr.TextField" positionIncrementGap="100">
759
+ <analyzer>
760
+ <tokenizer class="solr.StandardTokenizerFactory"/>
761
+ <filter class="solr.LowerCaseFilterFactory"/>
762
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_hu.txt" format="snowball" />
763
+ <filter class="solr.SnowballPorterFilterFactory" language="Hungarian"/>
764
+ <!-- less aggressive: <filter class="solr.HungarianLightStemFilterFactory"/> -->
765
+ </analyzer>
766
+ </fieldType>
767
+
768
+ <!-- Armenian -->
769
+ <dynamicField name="*_txt_hy" type="text_hy" indexed="true" stored="true"/>
770
+ <fieldType name="text_hy" class="solr.TextField" positionIncrementGap="100">
771
+ <analyzer>
772
+ <tokenizer class="solr.StandardTokenizerFactory"/>
773
+ <filter class="solr.LowerCaseFilterFactory"/>
774
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_hy.txt" />
775
+ <filter class="solr.SnowballPorterFilterFactory" language="Armenian"/>
776
+ </analyzer>
777
+ </fieldType>
778
+
779
+ <!-- Indonesian -->
780
+ <dynamicField name="*_txt_id" type="text_id" indexed="true" stored="true"/>
781
+ <fieldType name="text_id" class="solr.TextField" positionIncrementGap="100">
782
+ <analyzer>
783
+ <tokenizer class="solr.StandardTokenizerFactory"/>
784
+ <filter class="solr.LowerCaseFilterFactory"/>
785
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_id.txt" />
786
+ <!-- for a less aggressive approach (only inflectional suffixes), set stemDerivational to false -->
787
+ <filter class="solr.IndonesianStemFilterFactory" stemDerivational="true"/>
788
+ </analyzer>
789
+ </fieldType>
790
+
791
+ <!-- Italian -->
792
+ <dynamicField name="*_txt_it" type="text_it" indexed="true" stored="true"/>
793
+ <fieldType name="text_it" class="solr.TextField" positionIncrementGap="100">
794
+ <analyzer>
795
+ <tokenizer class="solr.StandardTokenizerFactory"/>
796
+ <!-- removes l', etc -->
797
+ <filter class="solr.ElisionFilterFactory" ignoreCase="true" articles="lang/contractions_it.txt"/>
798
+ <filter class="solr.LowerCaseFilterFactory"/>
799
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_it.txt" format="snowball" />
800
+ <filter class="solr.ItalianLightStemFilterFactory"/>
801
+ <!-- more aggressive: <filter class="solr.SnowballPorterFilterFactory" language="Italian"/> -->
802
+ </analyzer>
803
+ </fieldType>
804
+
805
+ <!-- Japanese using morphological analysis (see text_cjk for a configuration using bigramming)
806
+
807
+ NOTE: If you want to optimize search for precision, use default operator AND in your request
808
+ handler config (q.op) Use OR if you would like to optimize for recall (default).
809
+ -->
810
+ <dynamicField name="*_txt_ja" type="text_ja" indexed="true" stored="true"/>
811
+ <fieldType name="text_ja" class="solr.TextField" positionIncrementGap="100" autoGeneratePhraseQueries="false">
812
+ <analyzer>
813
+ <!-- Kuromoji Japanese morphological analyzer/tokenizer (JapaneseTokenizer)
814
+
815
+ Kuromoji has a search mode (default) that does segmentation useful for search. A heuristic
816
+ is used to segment compounds into its parts and the compound itself is kept as synonym.
817
+
818
+ Valid values for attribute mode are:
819
+ normal: regular segmentation
820
+ search: segmentation useful for search with synonyms compounds (default)
821
+ extended: same as search mode, but unigrams unknown words (experimental)
822
+
823
+ For some applications it might be good to use search mode for indexing and normal mode for
824
+ queries to reduce recall and prevent parts of compounds from being matched and highlighted.
825
+ Use <analyzer type="index"> and <analyzer type="query"> for this and mode normal in query.
826
+
827
+ Kuromoji also has a convenient user dictionary feature that allows overriding the statistical
828
+ model with your own entries for segmentation, part-of-speech tags and readings without a need
829
+ to specify weights. Notice that user dictionaries have not been subject to extensive testing.
830
+
831
+ User dictionary attributes are:
832
+ userDictionary: user dictionary filename
833
+ userDictionaryEncoding: user dictionary encoding (default is UTF-8)
834
+
835
+ See lang/userdict_ja.txt for a sample user dictionary file.
836
+
837
+ Punctuation characters are discarded by default. Use discardPunctuation="false" to keep them.
838
+ -->
839
+ <tokenizer class="solr.JapaneseTokenizerFactory" mode="search"/>
840
+ <!--<tokenizer class="solr.JapaneseTokenizerFactory" mode="search" userDictionary="lang/userdict_ja.txt"/>-->
841
+ <!-- Reduces inflected verbs and adjectives to their base/dictionary forms (辞書形) -->
842
+ <filter class="solr.JapaneseBaseFormFilterFactory"/>
843
+ <!-- Removes tokens with certain part-of-speech tags -->
844
+ <filter class="solr.JapanesePartOfSpeechStopFilterFactory" tags="lang/stoptags_ja.txt" />
845
+ <!-- Normalizes full-width romaji to half-width and half-width kana to full-width (Unicode NFKC subset) -->
846
+ <filter class="solr.CJKWidthFilterFactory"/>
847
+ <!-- Removes common tokens typically not useful for search, but have a negative effect on ranking -->
848
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_ja.txt" />
849
+ <!-- Normalizes common katakana spelling variations by removing any last long sound character (U+30FC) -->
850
+ <filter class="solr.JapaneseKatakanaStemFilterFactory" minimumLength="4"/>
851
+ <!-- Lower-cases romaji characters -->
852
+ <filter class="solr.LowerCaseFilterFactory"/>
853
+ </analyzer>
854
+ </fieldType>
855
+
856
+ <!-- Korean morphological analysis -->
857
+ <dynamicField name="*_txt_ko" type="text_ko" indexed="true" stored="true"/>
858
+ <fieldType name="text_ko" class="solr.TextField" positionIncrementGap="100">
859
+ <analyzer>
860
+ <!-- Nori Korean morphological analyzer/tokenizer (KoreanTokenizer)
861
+ The Korean (nori) analyzer integrates Lucene nori analysis module into Solr.
862
+ It uses the mecab-ko-dic dictionary to perform morphological analysis of Korean texts.
863
+
864
+ This dictionary was built with MeCab, it defines a format for the features adapted
865
+ for the Korean language.
866
+
867
+ Nori also has a convenient user dictionary feature that allows overriding the statistical
868
+ model with your own entries for segmentation, part-of-speech tags and readings without a need
869
+ to specify weights. Notice that user dictionaries have not been subject to extensive testing.
870
+
871
+ The tokenizer supports multiple schema attributes:
872
+ * userDictionary: User dictionary path.
873
+ * userDictionaryEncoding: User dictionary encoding.
874
+ * decompoundMode: Decompound mode. Either 'none', 'discard', 'mixed'. Default is 'discard'.
875
+ * outputUnknownUnigrams: If true outputs unigrams for unknown words.
876
+ -->
877
+ <tokenizer class="solr.KoreanTokenizerFactory" decompoundMode="discard" outputUnknownUnigrams="false"/>
878
+ <!-- Removes some part of speech stuff like EOMI (Pos.E), you can add a parameter 'tags',
879
+ listing the tags to remove. By default it removes:
880
+ E, IC, J, MAG, MAJ, MM, SP, SSC, SSO, SC, SE, XPN, XSA, XSN, XSV, UNA, NA, VSV
881
+ This is basically an equivalent to stemming.
882
+ -->
883
+ <filter class="solr.KoreanPartOfSpeechStopFilterFactory" />
884
+ <!-- Replaces term text with the Hangul transcription of Hanja characters, if applicable: -->
885
+ <filter class="solr.KoreanReadingFormFilterFactory" />
886
+ <filter class="solr.LowerCaseFilterFactory" />
887
+ </analyzer>
888
+ </fieldType>
889
+
890
+ <!-- Latvian -->
891
+ <dynamicField name="*_txt_lv" type="text_lv" indexed="true" stored="true"/>
892
+ <fieldType name="text_lv" class="solr.TextField" positionIncrementGap="100">
893
+ <analyzer>
894
+ <tokenizer class="solr.StandardTokenizerFactory"/>
895
+ <filter class="solr.LowerCaseFilterFactory"/>
896
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_lv.txt" />
897
+ <filter class="solr.LatvianStemFilterFactory"/>
898
+ </analyzer>
899
+ </fieldType>
900
+
901
+ <!-- Dutch -->
902
+ <dynamicField name="*_txt_nl" type="text_nl" indexed="true" stored="true"/>
903
+ <fieldType name="text_nl" class="solr.TextField" positionIncrementGap="100">
904
+ <analyzer>
905
+ <tokenizer class="solr.StandardTokenizerFactory"/>
906
+ <filter class="solr.LowerCaseFilterFactory"/>
907
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_nl.txt" format="snowball" />
908
+ <filter class="solr.StemmerOverrideFilterFactory" dictionary="lang/stemdict_nl.txt" ignoreCase="false"/>
909
+ <filter class="solr.SnowballPorterFilterFactory" language="Dutch"/>
910
+ </analyzer>
911
+ </fieldType>
912
+
913
+ <!-- Norwegian -->
914
+ <dynamicField name="*_txt_no" type="text_no" indexed="true" stored="true"/>
915
+ <fieldType name="text_no" class="solr.TextField" positionIncrementGap="100">
916
+ <analyzer>
917
+ <tokenizer class="solr.StandardTokenizerFactory"/>
918
+ <filter class="solr.LowerCaseFilterFactory"/>
919
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_no.txt" format="snowball" />
920
+ <filter class="solr.SnowballPorterFilterFactory" language="Norwegian"/>
921
+ <!-- less aggressive: <filter class="solr.NorwegianLightStemFilterFactory"/> -->
922
+ <!-- singular/plural: <filter class="solr.NorwegianMinimalStemFilterFactory"/> -->
923
+ </analyzer>
924
+ </fieldType>
925
+
926
+ <!-- Portuguese -->
927
+ <dynamicField name="*_txt_pt" type="text_pt" indexed="true" stored="true"/>
928
+ <fieldType name="text_pt" class="solr.TextField" positionIncrementGap="100">
929
+ <analyzer>
930
+ <tokenizer class="solr.StandardTokenizerFactory"/>
931
+ <filter class="solr.LowerCaseFilterFactory"/>
932
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_pt.txt" format="snowball" />
933
+ <filter class="solr.PortugueseLightStemFilterFactory"/>
934
+ <!-- less aggressive: <filter class="solr.PortugueseMinimalStemFilterFactory"/> -->
935
+ <!-- more aggressive: <filter class="solr.SnowballPorterFilterFactory" language="Portuguese"/> -->
936
+ <!-- most aggressive: <filter class="solr.PortugueseStemFilterFactory"/> -->
937
+ </analyzer>
938
+ </fieldType>
939
+
940
+ <!-- Romanian -->
941
+ <dynamicField name="*_txt_ro" type="text_ro" indexed="true" stored="true"/>
942
+ <fieldType name="text_ro" class="solr.TextField" positionIncrementGap="100">
943
+ <analyzer>
944
+ <tokenizer class="solr.StandardTokenizerFactory"/>
945
+ <filter class="solr.LowerCaseFilterFactory"/>
946
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_ro.txt" />
947
+ <filter class="solr.SnowballPorterFilterFactory" language="Romanian"/>
948
+ </analyzer>
949
+ </fieldType>
950
+
951
+ <!-- Russian -->
952
+ <dynamicField name="*_txt_ru" type="text_ru" indexed="true" stored="true"/>
953
+ <fieldType name="text_ru" class="solr.TextField" positionIncrementGap="100">
954
+ <analyzer>
955
+ <tokenizer class="solr.StandardTokenizerFactory"/>
956
+ <filter class="solr.LowerCaseFilterFactory"/>
957
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_ru.txt" format="snowball" />
958
+ <filter class="solr.SnowballPorterFilterFactory" language="Russian"/>
959
+ <!-- less aggressive: <filter class="solr.RussianLightStemFilterFactory"/> -->
960
+ </analyzer>
961
+ </fieldType>
962
+
963
+ <!-- Swedish -->
964
+ <dynamicField name="*_txt_sv" type="text_sv" indexed="true" stored="true"/>
965
+ <fieldType name="text_sv" class="solr.TextField" positionIncrementGap="100">
966
+ <analyzer>
967
+ <tokenizer class="solr.StandardTokenizerFactory"/>
968
+ <filter class="solr.LowerCaseFilterFactory"/>
969
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_sv.txt" format="snowball" />
970
+ <filter class="solr.SnowballPorterFilterFactory" language="Swedish"/>
971
+ <!-- less aggressive: <filter class="solr.SwedishLightStemFilterFactory"/> -->
972
+ </analyzer>
973
+ </fieldType>
974
+
975
+ <!-- Thai -->
976
+ <dynamicField name="*_txt_th" type="text_th" indexed="true" stored="true"/>
977
+ <fieldType name="text_th" class="solr.TextField" positionIncrementGap="100">
978
+ <analyzer>
979
+ <tokenizer class="solr.ThaiTokenizerFactory"/>
980
+ <filter class="solr.LowerCaseFilterFactory"/>
981
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_th.txt" />
982
+ </analyzer>
983
+ </fieldType>
984
+
985
+ <!-- Turkish -->
986
+ <dynamicField name="*_txt_tr" type="text_tr" indexed="true" stored="true"/>
987
+ <fieldType name="text_tr" class="solr.TextField" positionIncrementGap="100">
988
+ <analyzer>
989
+ <tokenizer class="solr.StandardTokenizerFactory"/>
990
+ <filter class="solr.TurkishLowerCaseFilterFactory"/>
991
+ <filter class="solr.StopFilterFactory" ignoreCase="false" words="lang/stopwords_tr.txt" />
992
+ <filter class="solr.SnowballPorterFilterFactory" language="Turkish"/>
993
+ </analyzer>
994
+ </fieldType>
995
+
996
+ <!-- Similarity is the scoring routine for each document vs. a query.
997
+ A custom Similarity or SimilarityFactory may be specified here, but
998
+ the default is fine for most applications.
999
+ For more info: http://lucene.apache.org/solr/guide/other-schema-elements.html#OtherSchemaElements-Similarity
1000
+ -->
1001
+ <!--
1002
+ <similarity class="com.example.solr.CustomSimilarityFactory">
1003
+ <str name="paramkey">param value</str>
1004
+ </similarity>
1005
+ -->
1006
+
1007
+ </schema>