chewy 0.8.4 → 7.3.4

Sign up to get free protection for your applications and to get access to all the features.
Files changed (340) hide show
  1. checksums.yaml +5 -5
  2. data/.github/CODEOWNERS +1 -0
  3. data/.github/ISSUE_TEMPLATE/bug_report.md +39 -0
  4. data/.github/ISSUE_TEMPLATE/feature_request.md +20 -0
  5. data/.github/PULL_REQUEST_TEMPLATE.md +16 -0
  6. data/.github/workflows/ruby.yml +74 -0
  7. data/.gitignore +1 -0
  8. data/.rubocop.yml +61 -0
  9. data/.rubocop_todo.yml +132 -0
  10. data/.yardopts +5 -0
  11. data/CHANGELOG.md +554 -245
  12. data/CODE_OF_CONDUCT.md +14 -0
  13. data/CONTRIBUTING.md +63 -0
  14. data/Gemfile +14 -11
  15. data/Guardfile +8 -6
  16. data/LICENSE.txt +1 -1
  17. data/README.md +748 -623
  18. data/Rakefile +11 -1
  19. data/chewy.gemspec +15 -19
  20. data/gemfiles/rails.5.2.activerecord.gemfile +11 -0
  21. data/gemfiles/rails.6.0.activerecord.gemfile +11 -0
  22. data/gemfiles/rails.6.1.activerecord.gemfile +13 -0
  23. data/gemfiles/rails.7.0.activerecord.gemfile +13 -0
  24. data/lib/chewy/config.rb +64 -50
  25. data/lib/chewy/errors.rb +10 -16
  26. data/lib/chewy/fields/base.rb +122 -32
  27. data/lib/chewy/fields/root.rb +48 -23
  28. data/lib/chewy/index/actions.rb +140 -54
  29. data/lib/chewy/index/adapter/active_record.rb +112 -0
  30. data/lib/chewy/{type → index}/adapter/base.rb +31 -12
  31. data/lib/chewy/index/adapter/object.rb +249 -0
  32. data/lib/chewy/index/adapter/orm.rb +194 -0
  33. data/lib/chewy/index/aliases.rb +14 -4
  34. data/lib/chewy/index/crutch.rb +40 -0
  35. data/lib/chewy/index/import/bulk_builder.rb +311 -0
  36. data/lib/chewy/index/import/bulk_request.rb +77 -0
  37. data/lib/chewy/index/import/journal_builder.rb +44 -0
  38. data/lib/chewy/index/import/routine.rb +139 -0
  39. data/lib/chewy/index/import.rb +243 -0
  40. data/lib/chewy/{type → index}/mapping.rb +79 -68
  41. data/lib/chewy/index/observe/active_record_methods.rb +87 -0
  42. data/lib/chewy/index/observe/callback.rb +34 -0
  43. data/lib/chewy/index/observe.rb +17 -0
  44. data/lib/chewy/index/settings.rb +10 -5
  45. data/lib/chewy/index/specification.rb +61 -0
  46. data/lib/chewy/index/syncer.rb +221 -0
  47. data/lib/chewy/{type → index}/witchcraft.rb +100 -39
  48. data/lib/chewy/index/wrapper.rb +95 -0
  49. data/lib/chewy/index.rb +216 -140
  50. data/lib/chewy/journal.rb +66 -0
  51. data/lib/chewy/log_subscriber.rb +8 -8
  52. data/lib/chewy/minitest/helpers.rb +150 -0
  53. data/lib/chewy/minitest/search_index_receiver.rb +76 -0
  54. data/lib/chewy/minitest.rb +1 -0
  55. data/lib/chewy/multi_search.rb +62 -0
  56. data/lib/chewy/railtie.rb +12 -25
  57. data/lib/chewy/rake_helper.rb +335 -37
  58. data/lib/chewy/repository.rb +2 -2
  59. data/lib/chewy/rspec/build_query.rb +12 -0
  60. data/lib/chewy/rspec/helpers.rb +55 -0
  61. data/lib/chewy/rspec/update_index.rb +106 -90
  62. data/lib/chewy/rspec.rb +3 -1
  63. data/lib/chewy/runtime/version.rb +4 -4
  64. data/lib/chewy/runtime.rb +1 -1
  65. data/lib/chewy/search/loader.rb +61 -0
  66. data/lib/chewy/{query → search}/pagination/kaminari.rb +13 -5
  67. data/lib/chewy/search/parameters/aggs.rb +16 -0
  68. data/lib/chewy/search/parameters/allow_partial_search_results.rb +27 -0
  69. data/lib/chewy/search/parameters/collapse.rb +16 -0
  70. data/lib/chewy/search/parameters/concerns/bool_storage.rb +24 -0
  71. data/lib/chewy/search/parameters/concerns/hash_storage.rb +23 -0
  72. data/lib/chewy/search/parameters/concerns/integer_storage.rb +14 -0
  73. data/lib/chewy/search/parameters/concerns/query_storage.rb +238 -0
  74. data/lib/chewy/search/parameters/concerns/string_array_storage.rb +23 -0
  75. data/lib/chewy/search/parameters/concerns/string_storage.rb +14 -0
  76. data/lib/chewy/search/parameters/docvalue_fields.rb +12 -0
  77. data/lib/chewy/search/parameters/explain.rb +16 -0
  78. data/lib/chewy/search/parameters/filter.rb +47 -0
  79. data/lib/chewy/search/parameters/highlight.rb +16 -0
  80. data/lib/chewy/search/parameters/ignore_unavailable.rb +27 -0
  81. data/lib/chewy/search/parameters/indices.rb +78 -0
  82. data/lib/chewy/search/parameters/indices_boost.rb +52 -0
  83. data/lib/chewy/search/parameters/limit.rb +17 -0
  84. data/lib/chewy/search/parameters/load.rb +32 -0
  85. data/lib/chewy/search/parameters/min_score.rb +16 -0
  86. data/lib/chewy/search/parameters/none.rb +25 -0
  87. data/lib/chewy/search/parameters/offset.rb +17 -0
  88. data/lib/chewy/search/parameters/order.rb +51 -0
  89. data/lib/chewy/search/parameters/post_filter.rb +19 -0
  90. data/lib/chewy/search/parameters/preference.rb +16 -0
  91. data/lib/chewy/search/parameters/profile.rb +16 -0
  92. data/lib/chewy/search/parameters/query.rb +19 -0
  93. data/lib/chewy/search/parameters/request_cache.rb +27 -0
  94. data/lib/chewy/search/parameters/rescore.rb +29 -0
  95. data/lib/chewy/search/parameters/script_fields.rb +16 -0
  96. data/lib/chewy/search/parameters/search_after.rb +20 -0
  97. data/lib/chewy/search/parameters/search_type.rb +16 -0
  98. data/lib/chewy/search/parameters/source.rb +77 -0
  99. data/lib/chewy/search/parameters/storage.rb +95 -0
  100. data/lib/chewy/search/parameters/stored_fields.rb +63 -0
  101. data/lib/chewy/search/parameters/suggest.rb +16 -0
  102. data/lib/chewy/search/parameters/terminate_after.rb +16 -0
  103. data/lib/chewy/search/parameters/timeout.rb +16 -0
  104. data/lib/chewy/search/parameters/track_scores.rb +16 -0
  105. data/lib/chewy/search/parameters/track_total_hits.rb +16 -0
  106. data/lib/chewy/search/parameters/version.rb +16 -0
  107. data/lib/chewy/search/parameters.rb +170 -0
  108. data/lib/chewy/search/query_proxy.rb +264 -0
  109. data/lib/chewy/search/request.rb +1071 -0
  110. data/lib/chewy/search/response.rb +119 -0
  111. data/lib/chewy/search/scoping.rb +49 -0
  112. data/lib/chewy/search/scrolling.rb +137 -0
  113. data/lib/chewy/search.rb +68 -28
  114. data/lib/chewy/stash.rb +68 -0
  115. data/lib/chewy/strategy/active_job.rb +3 -2
  116. data/lib/chewy/strategy/atomic.rb +2 -4
  117. data/lib/chewy/strategy/atomic_no_refresh.rb +18 -0
  118. data/lib/chewy/strategy/base.rb +13 -3
  119. data/lib/chewy/strategy/bypass.rb +1 -2
  120. data/lib/chewy/strategy/delayed_sidekiq/scheduler.rb +148 -0
  121. data/lib/chewy/strategy/delayed_sidekiq/worker.rb +52 -0
  122. data/lib/chewy/strategy/delayed_sidekiq.rb +17 -0
  123. data/lib/chewy/strategy/lazy_sidekiq.rb +64 -0
  124. data/lib/chewy/strategy/sidekiq.rb +15 -2
  125. data/lib/chewy/strategy/urgent.rb +1 -1
  126. data/lib/chewy/strategy.rb +16 -20
  127. data/lib/chewy/version.rb +1 -1
  128. data/lib/chewy.rb +81 -82
  129. data/lib/generators/chewy/install_generator.rb +3 -3
  130. data/lib/tasks/chewy.rake +99 -32
  131. data/migration_guide.md +56 -0
  132. data/spec/chewy/config_spec.rb +87 -15
  133. data/spec/chewy/fields/base_spec.rb +542 -233
  134. data/spec/chewy/fields/root_spec.rb +115 -17
  135. data/spec/chewy/fields/time_fields_spec.rb +13 -12
  136. data/spec/chewy/index/actions_spec.rb +595 -77
  137. data/spec/chewy/index/adapter/active_record_spec.rb +601 -0
  138. data/spec/chewy/index/adapter/object_spec.rb +243 -0
  139. data/spec/chewy/index/aliases_spec.rb +5 -5
  140. data/spec/chewy/index/import/bulk_builder_spec.rb +494 -0
  141. data/spec/chewy/index/import/bulk_request_spec.rb +95 -0
  142. data/spec/chewy/index/import/journal_builder_spec.rb +87 -0
  143. data/spec/chewy/index/import/routine_spec.rb +110 -0
  144. data/spec/chewy/index/import_spec.rb +615 -0
  145. data/spec/chewy/index/mapping_spec.rb +135 -0
  146. data/spec/chewy/index/observe/active_record_methods_spec.rb +68 -0
  147. data/spec/chewy/index/observe/callback_spec.rb +139 -0
  148. data/spec/chewy/index/observe_spec.rb +143 -0
  149. data/spec/chewy/index/settings_spec.rb +103 -50
  150. data/spec/chewy/index/specification_spec.rb +159 -0
  151. data/spec/chewy/index/syncer_spec.rb +118 -0
  152. data/spec/chewy/index/witchcraft_spec.rb +245 -0
  153. data/spec/chewy/index/wrapper_spec.rb +100 -0
  154. data/spec/chewy/index_spec.rb +149 -121
  155. data/spec/chewy/journal_spec.rb +223 -0
  156. data/spec/chewy/minitest/helpers_spec.rb +198 -0
  157. data/spec/chewy/minitest/search_index_receiver_spec.rb +118 -0
  158. data/spec/chewy/multi_search_spec.rb +84 -0
  159. data/spec/chewy/rake_helper_spec.rb +656 -0
  160. data/spec/chewy/repository_spec.rb +8 -8
  161. data/spec/chewy/rspec/build_query_spec.rb +34 -0
  162. data/spec/chewy/rspec/helpers_spec.rb +61 -0
  163. data/spec/chewy/rspec/update_index_spec.rb +220 -114
  164. data/spec/chewy/runtime_spec.rb +2 -2
  165. data/spec/chewy/search/loader_spec.rb +83 -0
  166. data/spec/chewy/search/pagination/kaminari_examples.rb +69 -0
  167. data/spec/chewy/search/pagination/kaminari_spec.rb +21 -0
  168. data/spec/chewy/search/parameters/aggs_spec.rb +5 -0
  169. data/spec/chewy/search/parameters/bool_storage_examples.rb +53 -0
  170. data/spec/chewy/search/parameters/collapse_spec.rb +5 -0
  171. data/spec/chewy/search/parameters/docvalue_fields_spec.rb +5 -0
  172. data/spec/chewy/search/parameters/explain_spec.rb +5 -0
  173. data/spec/chewy/search/parameters/filter_spec.rb +5 -0
  174. data/spec/chewy/search/parameters/hash_storage_examples.rb +59 -0
  175. data/spec/chewy/search/parameters/highlight_spec.rb +5 -0
  176. data/spec/chewy/search/parameters/ignore_unavailable_spec.rb +67 -0
  177. data/spec/chewy/search/parameters/indices_spec.rb +99 -0
  178. data/spec/chewy/search/parameters/integer_storage_examples.rb +32 -0
  179. data/spec/chewy/search/parameters/limit_spec.rb +5 -0
  180. data/spec/chewy/search/parameters/load_spec.rb +60 -0
  181. data/spec/chewy/search/parameters/min_score_spec.rb +32 -0
  182. data/spec/chewy/search/parameters/none_spec.rb +5 -0
  183. data/spec/chewy/search/parameters/offset_spec.rb +5 -0
  184. data/spec/chewy/search/parameters/order_spec.rb +72 -0
  185. data/spec/chewy/search/parameters/post_filter_spec.rb +5 -0
  186. data/spec/chewy/search/parameters/preference_spec.rb +5 -0
  187. data/spec/chewy/search/parameters/profile_spec.rb +5 -0
  188. data/spec/chewy/search/parameters/query_spec.rb +5 -0
  189. data/spec/chewy/search/parameters/query_storage_examples.rb +434 -0
  190. data/spec/chewy/search/parameters/request_cache_spec.rb +67 -0
  191. data/spec/chewy/search/parameters/rescore_spec.rb +62 -0
  192. data/spec/chewy/search/parameters/script_fields_spec.rb +5 -0
  193. data/spec/chewy/search/parameters/search_after_spec.rb +35 -0
  194. data/spec/chewy/search/parameters/search_type_spec.rb +5 -0
  195. data/spec/chewy/search/parameters/source_spec.rb +162 -0
  196. data/spec/chewy/search/parameters/storage_spec.rb +60 -0
  197. data/spec/chewy/search/parameters/stored_fields_spec.rb +126 -0
  198. data/spec/chewy/search/parameters/string_array_storage_examples.rb +63 -0
  199. data/spec/chewy/search/parameters/string_storage_examples.rb +32 -0
  200. data/spec/chewy/search/parameters/suggest_spec.rb +5 -0
  201. data/spec/chewy/search/parameters/terminate_after_spec.rb +5 -0
  202. data/spec/chewy/search/parameters/timeout_spec.rb +5 -0
  203. data/spec/chewy/search/parameters/track_scores_spec.rb +5 -0
  204. data/spec/chewy/search/parameters/track_total_hits_spec.rb +5 -0
  205. data/spec/chewy/search/parameters/version_spec.rb +5 -0
  206. data/spec/chewy/search/parameters_spec.rb +161 -0
  207. data/spec/chewy/search/query_proxy_spec.rb +119 -0
  208. data/spec/chewy/search/request_spec.rb +880 -0
  209. data/spec/chewy/search/response_spec.rb +202 -0
  210. data/spec/chewy/search/scrolling_spec.rb +171 -0
  211. data/spec/chewy/search_spec.rb +82 -55
  212. data/spec/chewy/stash_spec.rb +85 -0
  213. data/spec/chewy/strategy/active_job_spec.rb +27 -8
  214. data/spec/chewy/strategy/atomic_no_refresh_spec.rb +60 -0
  215. data/spec/chewy/strategy/atomic_spec.rb +13 -11
  216. data/spec/chewy/strategy/delayed_sidekiq_spec.rb +190 -0
  217. data/spec/chewy/strategy/lazy_sidekiq_spec.rb +214 -0
  218. data/spec/chewy/strategy/sidekiq_spec.rb +19 -7
  219. data/spec/chewy/strategy_spec.rb +19 -15
  220. data/spec/chewy_spec.rb +65 -88
  221. data/spec/spec_helper.rb +11 -20
  222. data/spec/support/active_record.rb +48 -6
  223. data/spec/support/class_helpers.rb +4 -19
  224. metadata +299 -183
  225. data/.travis.yml +0 -76
  226. data/Appraisals +0 -76
  227. data/gemfiles/rails.3.2.activerecord.gemfile +0 -15
  228. data/gemfiles/rails.3.2.activerecord.kaminari.gemfile +0 -14
  229. data/gemfiles/rails.3.2.activerecord.will_paginate.gemfile +0 -14
  230. data/gemfiles/rails.4.0.activerecord.gemfile +0 -15
  231. data/gemfiles/rails.4.0.activerecord.kaminari.gemfile +0 -14
  232. data/gemfiles/rails.4.0.activerecord.will_paginate.gemfile +0 -14
  233. data/gemfiles/rails.4.0.mongoid.4.0.0.gemfile +0 -15
  234. data/gemfiles/rails.4.0.mongoid.4.0.0.kaminari.gemfile +0 -14
  235. data/gemfiles/rails.4.0.mongoid.4.0.0.will_paginate.gemfile +0 -14
  236. data/gemfiles/rails.4.0.mongoid.5.1.0.gemfile +0 -15
  237. data/gemfiles/rails.4.0.mongoid.5.1.0.kaminari.gemfile +0 -14
  238. data/gemfiles/rails.4.0.mongoid.5.1.0.will_paginate.gemfile +0 -14
  239. data/gemfiles/rails.4.1.activerecord.gemfile +0 -15
  240. data/gemfiles/rails.4.1.activerecord.kaminari.gemfile +0 -14
  241. data/gemfiles/rails.4.1.activerecord.will_paginate.gemfile +0 -14
  242. data/gemfiles/rails.4.1.mongoid.4.0.0.gemfile +0 -15
  243. data/gemfiles/rails.4.1.mongoid.4.0.0.kaminari.gemfile +0 -14
  244. data/gemfiles/rails.4.1.mongoid.4.0.0.will_paginate.gemfile +0 -14
  245. data/gemfiles/rails.4.1.mongoid.5.1.0.gemfile +0 -15
  246. data/gemfiles/rails.4.1.mongoid.5.1.0.kaminari.gemfile +0 -14
  247. data/gemfiles/rails.4.1.mongoid.5.1.0.will_paginate.gemfile +0 -14
  248. data/gemfiles/rails.4.2.activerecord.gemfile +0 -16
  249. data/gemfiles/rails.4.2.activerecord.kaminari.gemfile +0 -15
  250. data/gemfiles/rails.4.2.activerecord.will_paginate.gemfile +0 -15
  251. data/gemfiles/rails.4.2.mongoid.4.0.0.gemfile +0 -15
  252. data/gemfiles/rails.4.2.mongoid.4.0.0.kaminari.gemfile +0 -14
  253. data/gemfiles/rails.4.2.mongoid.4.0.0.will_paginate.gemfile +0 -14
  254. data/gemfiles/rails.4.2.mongoid.5.1.0.gemfile +0 -15
  255. data/gemfiles/rails.4.2.mongoid.5.1.0.kaminari.gemfile +0 -14
  256. data/gemfiles/rails.4.2.mongoid.5.1.0.will_paginate.gemfile +0 -14
  257. data/gemfiles/rails.5.0.0.beta3.activerecord.gemfile +0 -16
  258. data/gemfiles/rails.5.0.0.beta3.activerecord.kaminari.gemfile +0 -16
  259. data/gemfiles/rails.5.0.0.beta3.activerecord.will_paginate.gemfile +0 -15
  260. data/gemfiles/sequel.4.31.gemfile +0 -13
  261. data/lib/chewy/backports/deep_dup.rb +0 -46
  262. data/lib/chewy/backports/duplicable.rb +0 -90
  263. data/lib/chewy/query/compose.rb +0 -69
  264. data/lib/chewy/query/criteria.rb +0 -181
  265. data/lib/chewy/query/filters.rb +0 -227
  266. data/lib/chewy/query/loading.rb +0 -111
  267. data/lib/chewy/query/nodes/and.rb +0 -25
  268. data/lib/chewy/query/nodes/base.rb +0 -17
  269. data/lib/chewy/query/nodes/bool.rb +0 -32
  270. data/lib/chewy/query/nodes/equal.rb +0 -34
  271. data/lib/chewy/query/nodes/exists.rb +0 -20
  272. data/lib/chewy/query/nodes/expr.rb +0 -28
  273. data/lib/chewy/query/nodes/field.rb +0 -106
  274. data/lib/chewy/query/nodes/has_child.rb +0 -14
  275. data/lib/chewy/query/nodes/has_parent.rb +0 -14
  276. data/lib/chewy/query/nodes/has_relation.rb +0 -61
  277. data/lib/chewy/query/nodes/match_all.rb +0 -11
  278. data/lib/chewy/query/nodes/missing.rb +0 -20
  279. data/lib/chewy/query/nodes/not.rb +0 -25
  280. data/lib/chewy/query/nodes/or.rb +0 -25
  281. data/lib/chewy/query/nodes/prefix.rb +0 -18
  282. data/lib/chewy/query/nodes/query.rb +0 -20
  283. data/lib/chewy/query/nodes/range.rb +0 -63
  284. data/lib/chewy/query/nodes/raw.rb +0 -15
  285. data/lib/chewy/query/nodes/regexp.rb +0 -31
  286. data/lib/chewy/query/nodes/script.rb +0 -20
  287. data/lib/chewy/query/pagination/will_paginate.rb +0 -27
  288. data/lib/chewy/query/pagination.rb +0 -16
  289. data/lib/chewy/query/scoping.rb +0 -20
  290. data/lib/chewy/query.rb +0 -1026
  291. data/lib/chewy/strategy/resque.rb +0 -26
  292. data/lib/chewy/type/actions.rb +0 -19
  293. data/lib/chewy/type/adapter/active_record.rb +0 -72
  294. data/lib/chewy/type/adapter/mongoid.rb +0 -58
  295. data/lib/chewy/type/adapter/object.rb +0 -89
  296. data/lib/chewy/type/adapter/orm.rb +0 -156
  297. data/lib/chewy/type/adapter/sequel.rb +0 -75
  298. data/lib/chewy/type/crutch.rb +0 -31
  299. data/lib/chewy/type/import.rb +0 -224
  300. data/lib/chewy/type/observe.rb +0 -76
  301. data/lib/chewy/type/wrapper.rb +0 -53
  302. data/lib/chewy/type.rb +0 -89
  303. data/lib/sequel/plugins/chewy_observe.rb +0 -78
  304. data/spec/chewy/query/criteria_spec.rb +0 -433
  305. data/spec/chewy/query/filters_spec.rb +0 -173
  306. data/spec/chewy/query/loading_spec.rb +0 -86
  307. data/spec/chewy/query/nodes/and_spec.rb +0 -16
  308. data/spec/chewy/query/nodes/bool_spec.rb +0 -22
  309. data/spec/chewy/query/nodes/equal_spec.rb +0 -32
  310. data/spec/chewy/query/nodes/exists_spec.rb +0 -18
  311. data/spec/chewy/query/nodes/has_child_spec.rb +0 -40
  312. data/spec/chewy/query/nodes/has_parent_spec.rb +0 -40
  313. data/spec/chewy/query/nodes/match_all_spec.rb +0 -11
  314. data/spec/chewy/query/nodes/missing_spec.rb +0 -15
  315. data/spec/chewy/query/nodes/not_spec.rb +0 -16
  316. data/spec/chewy/query/nodes/or_spec.rb +0 -16
  317. data/spec/chewy/query/nodes/prefix_spec.rb +0 -16
  318. data/spec/chewy/query/nodes/query_spec.rb +0 -12
  319. data/spec/chewy/query/nodes/range_spec.rb +0 -32
  320. data/spec/chewy/query/nodes/raw_spec.rb +0 -11
  321. data/spec/chewy/query/nodes/regexp_spec.rb +0 -31
  322. data/spec/chewy/query/nodes/script_spec.rb +0 -15
  323. data/spec/chewy/query/pagination/kaminari_spec.rb +0 -57
  324. data/spec/chewy/query/pagination/will_paginage_spec.rb +0 -60
  325. data/spec/chewy/query/pagination_spec.rb +0 -36
  326. data/spec/chewy/query_spec.rb +0 -632
  327. data/spec/chewy/strategy/resque_spec.rb +0 -40
  328. data/spec/chewy/type/actions_spec.rb +0 -31
  329. data/spec/chewy/type/adapter/active_record_spec.rb +0 -317
  330. data/spec/chewy/type/adapter/mongoid_spec.rb +0 -253
  331. data/spec/chewy/type/adapter/object_spec.rb +0 -139
  332. data/spec/chewy/type/adapter/sequel_spec.rb +0 -320
  333. data/spec/chewy/type/import_spec.rb +0 -433
  334. data/spec/chewy/type/mapping_spec.rb +0 -106
  335. data/spec/chewy/type/observe_spec.rb +0 -127
  336. data/spec/chewy/type/witchcraft_spec.rb +0 -154
  337. data/spec/chewy/type/wrapper_spec.rb +0 -58
  338. data/spec/chewy/type_spec.rb +0 -33
  339. data/spec/support/mongoid.rb +0 -81
  340. data/spec/support/sequel.rb +0 -75
@@ -0,0 +1,311 @@
1
+ module Chewy
2
+ class Index
3
+ module Import
4
+ # The purpose of this class is to build an ES client-acceptable bulk
5
+ # request body from the passed objects for index and deletion.
6
+ # It handles parent-child relationships as well by fetching
7
+ # existing documents from ES and database, taking their join field values and
8
+ # using it in the bulk body.
9
+ # If fields are passed - it creates partial update entries except for
10
+ # the cases when the type has parent and parent_id has been changed.
11
+ class BulkBuilder
12
+ # @param index [Chewy::Index] desired index
13
+ # @param to_index [Array<Object>] objects to index
14
+ # @param delete [Array<Object>] objects or ids to delete
15
+ # @param fields [Array<Symbol, String>] an array of fields for document updates
16
+ def initialize(index, to_index: [], delete: [], fields: [])
17
+ @index = index
18
+ @to_index = to_index
19
+ @delete = delete
20
+ @fields = fields.map!(&:to_sym)
21
+ end
22
+
23
+ # Returns an ES API-ready bulk request body.
24
+ # @see https://github.com/elastic/elasticsearch-ruby/blob/master/elasticsearch-api/lib/elasticsearch/api/actions/bulk.rb
25
+ # @return [Array<Hash>] bulk body
26
+ def bulk_body
27
+ populate_cache
28
+
29
+ @bulk_body ||= @to_index.flat_map(&method(:index_entry)).concat(
30
+ @delete.flat_map(&method(:delete_entry))
31
+ ).uniq
32
+ end
33
+
34
+ # The only purpose of this method is to cache document ids for
35
+ # all the passed objects for indexing to avoid id recalculation.
36
+ #
37
+ # @return [Hash{String => Object}] an ids-objects index hash
38
+ def index_objects_by_id
39
+ @index_objects_by_id ||= index_object_ids.invert.stringify_keys!
40
+ end
41
+
42
+ private
43
+
44
+ def crutches_for_index
45
+ @crutches_for_index ||= Chewy::Index::Crutch::Crutches.new @index, @to_index
46
+ end
47
+
48
+ def index_entry(object)
49
+ entry = {}
50
+ entry[:_id] = index_object_ids[object] if index_object_ids[object]
51
+ entry[:routing] = routing(object) if join_field?
52
+
53
+ parent = cache(entry[:_id])
54
+ data = data_for(object) if parent.present?
55
+ if parent.present? && parent_changed?(data, parent)
56
+ reindex_entries(object, data) + reindex_descendants(object)
57
+ elsif @fields.present?
58
+ return [] unless entry[:_id]
59
+
60
+ entry[:data] = {doc: data_for(object, fields: @fields)}
61
+ [{update: entry}]
62
+ else
63
+ entry[:data] = data || data_for(object)
64
+ [{index: entry}]
65
+ end
66
+ end
67
+
68
+ def reindex_entries(object, data, root: object)
69
+ entry = {}
70
+ entry[:_id] = index_object_ids[object] || entry_id(object)
71
+ entry[:data] = data
72
+ entry[:routing] = routing(root) || routing(object) if join_field?
73
+ delete = delete_single_entry(object, root: root).first
74
+ index = {index: entry}
75
+ [delete, index]
76
+ end
77
+
78
+ def reindex_descendants(root)
79
+ descendants = load_descendants(root)
80
+ crutches = Chewy::Index::Crutch::Crutches.new @index, [root, *descendants]
81
+ descendants.flat_map do |object|
82
+ reindex_entries(
83
+ object,
84
+ data_for(object, crutches: crutches),
85
+ root: root
86
+ )
87
+ end
88
+ end
89
+
90
+ def delete_entry(object)
91
+ delete_single_entry(object)
92
+ end
93
+
94
+ def delete_single_entry(object, root: object)
95
+ entry = {}
96
+ entry[:_id] = entry_id(object)
97
+ entry[:_id] ||= object.as_json
98
+
99
+ return [] if entry[:_id].blank?
100
+
101
+ if join_field?
102
+ cached_parent = cache(entry[:_id])
103
+ entry_parent_id =
104
+ if cached_parent
105
+ cached_parent[:parent_id]
106
+ else
107
+ find_parent_id(object)
108
+ end
109
+
110
+ entry[:routing] = existing_routing(root.try(:id)) || existing_routing(object.id)
111
+ entry[:parent] = entry_parent_id if entry_parent_id
112
+ end
113
+
114
+ [{delete: entry}]
115
+ end
116
+
117
+ def load_descendants(root)
118
+ root_type = join_field_type(root)
119
+ return [] unless root_type
120
+
121
+ descendant_ids = []
122
+ grouped_parents = {root_type => [root.id]}
123
+ # iteratively fetch all the descendants (with grouped_parents as a queue for next iteration)
124
+ until grouped_parents.empty?
125
+ children_data = grouped_parents.flat_map do |parent_type, parent_ids|
126
+ @index.query(
127
+ has_parent: {
128
+ parent_type: parent_type,
129
+ # ignore_unmapped to avoid error for the leaves of the tree
130
+ # (types without children)
131
+ ignore_unmapped: true,
132
+ query: {ids: {values: parent_ids}}
133
+ }
134
+ ).pluck(:_id, join_field).map { |id, join| [join['name'], id] }
135
+ end
136
+ descendant_ids |= children_data.map(&:last)
137
+
138
+ grouped_parents = {}
139
+ children_data.each do |name, id|
140
+ next unless name
141
+
142
+ grouped_parents[name] ||= []
143
+ grouped_parents[name] << id
144
+ end
145
+ end
146
+ # query the primary database to load the descendants' records
147
+ @index.adapter.load(descendant_ids, _index: @index.base_name, raw_import: @index._default_import_options[:raw_import])
148
+ end
149
+
150
+ def populate_cache
151
+ @cache = load_cache
152
+ end
153
+
154
+ def cache(id)
155
+ @cache[id.to_s]
156
+ end
157
+
158
+ def load_cache
159
+ return {} unless join_field?
160
+
161
+ @index
162
+ .filter(ids: {values: ids_for_cache})
163
+ .order('_doc')
164
+ .pluck(:_id, :_routing, join_field)
165
+ .map do |id, routing, join|
166
+ [
167
+ id,
168
+ {routing: routing, parent_id: join['parent']}
169
+ ]
170
+ end.to_h
171
+ end
172
+
173
+ def existing_routing(id)
174
+ # All objects needed here should be cached in #load_cache,
175
+ # if not, we return nil. In some cases we don't have existing routing cached,
176
+ # e.g. for loaded descendants
177
+ return unless cache(id)
178
+
179
+ cache(id)[:routing]
180
+ end
181
+
182
+ # Two types of ids:
183
+ # * of parents of the objects to be indexed
184
+ # * of objects to be deleted
185
+ def ids_for_cache
186
+ ids = @to_index.flat_map do |object|
187
+ [find_parent_id(object), object.id] if object.respond_to?(:id)
188
+ end
189
+ ids.concat(@delete.map do |object|
190
+ object.id if object.respond_to?(:id)
191
+ end)
192
+ ids.uniq.compact
193
+ end
194
+
195
+ def routing(object)
196
+ # filter out non-model objects, early return on object==nil
197
+ return unless object.respond_to?(:id)
198
+
199
+ parent_id = find_parent_id(object)
200
+ if parent_id
201
+ routing(index_objects_by_id[parent_id.to_s]) || existing_routing(parent_id)
202
+ else
203
+ object.id.to_s
204
+ end
205
+ end
206
+
207
+ def find_parent_id(object)
208
+ return unless object.respond_to?(:id)
209
+
210
+ join = data_for(object, fields: [join_field.to_sym])[join_field]
211
+ join['parent'] if join
212
+ end
213
+
214
+ def join_field
215
+ return @join_field if defined?(@join_field)
216
+
217
+ @join_field = find_join_field
218
+ end
219
+
220
+ def find_join_field
221
+ type_settings = @index.mappings_hash[:mappings]
222
+ return unless type_settings
223
+
224
+ properties = type_settings[:properties]
225
+ join_fields = properties.find { |_, options| options[:type] == :join }
226
+ return unless join_fields
227
+
228
+ join_fields.first.to_s
229
+ end
230
+
231
+ def join_field_type(object)
232
+ return unless join_field?
233
+
234
+ raw_object =
235
+ if @index._default_import_options[:raw_import]
236
+ @index._default_import_options[:raw_import].call(object.attributes)
237
+ else
238
+ object
239
+ end
240
+
241
+ join_field_value = data_for(
242
+ raw_object,
243
+ fields: [join_field.to_sym], # build only the field that is needed
244
+ crutches: Chewy::Index::Crutch::Crutches.new(@index, [raw_object])
245
+ )[join_field]
246
+
247
+ case join_field_value
248
+ when String
249
+ join_field_value
250
+ when Hash
251
+ join_field_value['name']
252
+ end
253
+ end
254
+
255
+ def join_field?
256
+ join_field && !join_field.empty?
257
+ end
258
+
259
+ def data_for(object, fields: [], crutches: crutches_for_index)
260
+ @index.compose(object, crutches, fields: fields)
261
+ end
262
+
263
+ def parent_changed?(data, old_parent)
264
+ return false unless old_parent
265
+ return false unless join_field?
266
+ return false unless @fields.include?(join_field.to_sym)
267
+ return false unless data.key?(join_field)
268
+
269
+ # The join field value can be a hash, e.g.:
270
+ # {"name": "child", "parent": "123"} for a child
271
+ # {"name": "parent"} for a parent
272
+ # but it can also be a string: (e.g. "parent") for a parent:
273
+ # https://www.elastic.co/guide/en/elasticsearch/reference/current/parent-join.html#parent-join
274
+ new_join_field_value = data[join_field]
275
+ if new_join_field_value.is_a? Hash
276
+ # If we have a hash in the join field,
277
+ # we're taking the `parent` field that holds the parent id.
278
+ new_parent_id = new_join_field_value['parent']
279
+ new_parent_id != old_parent[:parent_id]
280
+ else
281
+ # If there is a non-hash value (String or nil), it means that the join field is changed
282
+ # and the current object is no longer a child.
283
+ true
284
+ end
285
+ end
286
+
287
+ def entry_id(object)
288
+ if type_root.id
289
+ type_root.compose_id(object)
290
+ else
291
+ id = object.id if object.respond_to?(:id)
292
+ id ||= object[:id] || object['id'] if object.is_a?(Hash)
293
+ id = id.to_s if defined?(BSON) && id.is_a?(BSON::ObjectId)
294
+ id
295
+ end
296
+ end
297
+
298
+ def index_object_ids
299
+ @index_object_ids ||= @to_index.each_with_object({}) do |object, result|
300
+ id = entry_id(object)
301
+ result[object] = id if id.present?
302
+ end
303
+ end
304
+
305
+ def type_root
306
+ @type_root ||= @index.root
307
+ end
308
+ end
309
+ end
310
+ end
311
+ end
@@ -0,0 +1,77 @@
1
+ module Chewy
2
+ class Index
3
+ module Import
4
+ # Adds additional features to elasticsearch-api bulk method:
5
+ # * supports Chewy index suffix if necessary;
6
+ # * supports bulk_size, divides the passed body into chunks
7
+ # and performs a separate request for each chunk;
8
+ # * returns only errored document entries from the response
9
+ # if any present.
10
+ #
11
+ # @see https://github.com/elastic/elasticsearch-ruby/blob/master/elasticsearch-api/lib/elasticsearch/api/actions/bulk.rb
12
+ class BulkRequest
13
+ # @param index [Chewy::Index] an index for the request
14
+ # @param suffix [String] an index name optional suffix
15
+ # @param bulk_size [Integer] bulk size in bytes
16
+ # @param bulk_options [Hash] options passed to the elasticsearch-api bulk method
17
+ def initialize(index, suffix: nil, bulk_size: nil, **bulk_options)
18
+ @index = index
19
+ @suffix = suffix
20
+ @bulk_size = bulk_size - 1.kilobyte if bulk_size # 1 kilobyte for request header and newlines
21
+ @bulk_options = bulk_options
22
+
23
+ raise ArgumentError, '`bulk_size` can\'t be less than 1 kilobyte' if @bulk_size && @bulk_size <= 0
24
+ end
25
+
26
+ # Performs a bulk request with the passed body, returns empty
27
+ # array if everything is fine and array filled with errored
28
+ # document entries if something went wrong.
29
+ #
30
+ # @param body [Array<Hash>] a standard bulk request body
31
+ # @return [Array<Hash>] an array of bulk errors
32
+ def perform(body)
33
+ return [] if body.blank?
34
+
35
+ request_bodies(body).each_with_object([]) do |request_body, results|
36
+ response = @index.client.bulk(**request_base.merge(body: request_body)) if request_body.present?
37
+
38
+ next unless response.try(:[], 'errors')
39
+
40
+ response_items = (response.try(:[], 'items') || [])
41
+ .select { |item| item.values.first['error'] }
42
+ results.concat(response_items)
43
+ end
44
+ end
45
+
46
+ private
47
+
48
+ def request_base
49
+ @request_base ||= {
50
+ index: @index.index_name(suffix: @suffix)
51
+ }.merge!(@bulk_options)
52
+ end
53
+
54
+ def request_bodies(body)
55
+ if @bulk_size
56
+ serializer = ::Elasticsearch::API.serializer
57
+ pieces = body.each_with_object(['']) do |piece, result|
58
+ operation, meta = piece.to_a.first
59
+ data = meta.delete(:data)
60
+ piece = serializer.dump(operation => meta)
61
+ piece << "\n" << serializer.dump(data) if data.present?
62
+
63
+ if result.last.bytesize + piece.bytesize > @bulk_size
64
+ result.push(piece)
65
+ else
66
+ result[-1].blank? ? (result[-1] = piece) : (result[-1] << "\n" << piece)
67
+ end
68
+ end
69
+ pieces.each { |piece| piece << "\n" }
70
+ else
71
+ [body]
72
+ end
73
+ end
74
+ end
75
+ end
76
+ end
77
+ end
@@ -0,0 +1,44 @@
1
+ module Chewy
2
+ class Index
3
+ module Import
4
+ class JournalBuilder
5
+ def initialize(index, to_index: [], delete: [])
6
+ @index = index
7
+ @to_index = to_index
8
+ @delete = delete
9
+ end
10
+
11
+ def bulk_body
12
+ Chewy::Index::Import::BulkBuilder.new(
13
+ Chewy::Stash::Journal,
14
+ to_index: [
15
+ entries(:index, @to_index),
16
+ entries(:delete, @delete)
17
+ ].compact
18
+ ).bulk_body.each do |item|
19
+ item.values.first.merge!(
20
+ _index: Chewy::Stash::Journal.index_name
21
+ )
22
+ end
23
+ end
24
+
25
+ private
26
+
27
+ def entries(action, objects)
28
+ return unless objects.present?
29
+
30
+ {
31
+ index_name: @index.derivable_name,
32
+ action: action,
33
+ references: identify(objects).map { |item| Base64.encode64(::Elasticsearch::API.serializer.dump(item)) },
34
+ created_at: Time.now.utc
35
+ }
36
+ end
37
+
38
+ def identify(objects)
39
+ @index.adapter.identify(objects)
40
+ end
41
+ end
42
+ end
43
+ end
44
+ end
@@ -0,0 +1,139 @@
1
module Chewy
  class Index
    module Import
      # Performs the import routine for the given options and objects.
      #
      # 0. Create the target and journal indexes if needed.
      # 1. Iterate over all the passed objects in batches.
      # 2. For each batch the {#process} method is called, which:
      #   * creates a bulk request body;
      #   * appends journal entries for the current batch to the request body;
      #   * prepends the leftovers bulk, calculated from the errors of the
      #     previous iteration, to the request body;
      #   * performs the bulk request;
      #   * composes a new leftovers bulk for the next iteration from the
      #     response errors if `update_failover` is true;
      #   * appends the remaining unfixable errors to the instance level errors array.
      # 3. Perform the request for the last leftovers bulk if present using {#extract_leftovers}.
      # 4. Return the resulting errors array.
      #
      # At the moment it only tries to recover from partial document update
      # errors caused by a missing document, and only when the `update_failover`
      # option is true. To recover, it indexes such objects completely on the
      # next iteration.
      #
      # @see Chewy::Index::Import::ClassMethods#import
      class Routine
        BULK_OPTIONS = %i[
          suffix bulk_size
          refresh timeout fields pipeline
          consistency replication
          wait_for_active_shards routing _source _source_exclude _source_include
        ].freeze

        DEFAULT_OPTIONS = {
          refresh: true,
          update_fields: [],
          update_failover: true,
          batch_size: Chewy::Index::Adapter::Base::BATCH_SIZE
        }.freeze

        attr_reader :options, :parallel_options, :errors, :stats, :leftovers

        # Fills in missing options (index defaults first, then the configured
        # journal flag, then DEFAULT_OPTIONS), extracts the bulk request
        # specific options and normalizes the `:parallel` option.
        #
        # @param index [Chewy::Index] chewy index
        # @param options [Hash] import options, see {Chewy::Index::Import::ClassMethods#import}
        def initialize(index, **options)
          @index = index
          @options = options
          [
            @index._default_import_options,
            {journal: Chewy.configuration[:journal]},
            DEFAULT_OPTIONS
          ].each { |defaults| @options.reverse_merge!(defaults) }
          @bulk_options = @options.slice(*BULK_OPTIONS)

          # A Hash (or a falsy value) is kept as is, an Integer becomes the
          # process count, any other truthy value means "no explicit settings".
          parallel = @options.delete(:parallel)
          @parallel_options =
            case parallel
            when nil, false, Hash then parallel
            when Integer then {in_processes: parallel}
            else {}
            end

          @errors = []
          @stats = {}
          @leftovers = []
        end

        # Creates the journal index and the corresponding index if necessary.
        # Either creation can be switched off through the configuration.
        # @return [Object] whatever
        def create_indexes!
          create_journal = @options[:journal] && !Chewy.configuration[:skip_journal_creation_on_import]
          Chewy::Stash::Journal.create if create_journal

          return if Chewy.configuration[:skip_index_creation_on_import]
          return if @index.exists?

          @index.create!(**@bulk_options.slice(:suffix))
        end

        # The main process method. Converts the passed objects to a bulk request
        # body, appends journal entries, performs the request and handles the
        # errors, running the failover procedure if applicable.
        #
        # @param index [Array<Object>] any acceptable objects for indexing
        # @param delete [Array<Object>] any acceptable objects for deleting
        # @return [true, false] the result of the request, true if no errors
        def process(index: [], delete: [])
          builder = BulkBuilder.new(@index, to_index: index, delete: delete, fields: @options[:update_fields])
          request_body = builder.bulk_body

          if @options[:journal]
            journal_body = JournalBuilder.new(@index, to_index: index, delete: delete).bulk_body
            request_body.concat(journal_body)
          end

          # Retry material from the previous batch goes in front of this one.
          request_body.unshift(*flush_leftovers)

          perform_bulk(request_body) do |response|
            @leftovers = extract_leftovers(response, builder.index_objects_by_id)
            {index: index, delete: delete}.each do |action, objects|
              @stats[action] = @stats[action].to_i + objects.count if objects.present?
            end
          end
        end

        # Performs a bulk request for the passed body. The response errors are
        # yielded to the block (if given) before being collected in {#errors}.
        #
        # @param body [Array<Hash>] a standard bulk request body
        # @return [true, false] the result of the request, true if no errors
        def perform_bulk(body)
          failures = bulk.perform(body)
          yield(failures) if block_given?
          Chewy.wait_for_status
          @errors.concat(failures)
          !failures.present?
        end

      private

        # Hands out the accumulated leftovers and resets the storage.
        def flush_leftovers
          pending, @leftovers = @leftovers, []
          pending
        end

        # Picks the failed partial updates of missing documents out of the
        # errors, removes them from the passed errors array and returns a bulk
        # body that indexes the corresponding objects completely.
        def extract_leftovers(errors, index_objects_by_id)
          return [] if @options[:update_fields].blank? || !@options[:update_failover] || errors.blank?

          missing_by_id = errors.each_with_object({}) do |item, memo|
            action, details = item.first
            next unless action == 'update' && details['error']['type'] == 'document_missing_exception'

            memo[details['_id'].to_s] = item
          end

          # Only the documents that belong to the current batch can be re-imported.
          reimport_ids = missing_by_id.keys & index_objects_by_id.keys
          reimport_ids.each { |id| errors.delete(missing_by_id[id]) }

          objects = index_objects_by_id.values_at(*reimport_ids)
          BulkBuilder.new(@index, to_index: objects).bulk_body
        end

        # Memoized bulk request wrapper configured with the bulk options.
        def bulk
          @bulk ||= BulkRequest.new(@index, **@bulk_options)
        end
      end
    end
  end
end