chewy 0.9.0 → 0.10.0

Sign up to get free protection for your applications and to get access to all the features.
Files changed (265) hide show
  1. checksums.yaml +4 -4
  2. data/.gitignore +1 -0
  3. data/.rubocop.yml +24 -2
  4. data/.rubocop_todo.yml +2 -2
  5. data/.travis.yml +38 -21
  6. data/.yardopts +5 -0
  7. data/Appraisals +55 -27
  8. data/CHANGELOG.md +57 -12
  9. data/Gemfile +14 -10
  10. data/LEGACY_DSL.md +497 -0
  11. data/README.md +249 -515
  12. data/chewy.gemspec +5 -4
  13. data/gemfiles/rails.4.0.activerecord.gemfile +14 -0
  14. data/gemfiles/rails.4.1.activerecord.gemfile +14 -0
  15. data/gemfiles/rails.4.2.activerecord.gemfile +8 -10
  16. data/gemfiles/rails.4.2.mongoid.5.1.gemfile +9 -10
  17. data/gemfiles/rails.5.0.activerecord.gemfile +8 -10
  18. data/gemfiles/rails.5.0.mongoid.6.0.gemfile +15 -0
  19. data/gemfiles/rails.5.1.activerecord.gemfile +15 -0
  20. data/gemfiles/rails.5.1.mongoid.6.1.gemfile +15 -0
  21. data/gemfiles/sequel.4.45.gemfile +11 -0
  22. data/lib/chewy.rb +77 -43
  23. data/lib/chewy/config.rb +44 -7
  24. data/lib/chewy/errors.rb +2 -2
  25. data/lib/chewy/fields/base.rb +39 -32
  26. data/lib/chewy/fields/root.rb +33 -7
  27. data/lib/chewy/index.rb +237 -149
  28. data/lib/chewy/index/actions.rb +85 -28
  29. data/lib/chewy/index/aliases.rb +2 -1
  30. data/lib/chewy/index/settings.rb +9 -5
  31. data/lib/chewy/index/specification.rb +58 -0
  32. data/lib/chewy/journal.rb +40 -92
  33. data/lib/chewy/query.rb +43 -27
  34. data/lib/chewy/query/compose.rb +13 -13
  35. data/lib/chewy/query/criteria.rb +13 -13
  36. data/lib/chewy/query/filters.rb +1 -1
  37. data/lib/chewy/query/loading.rb +1 -1
  38. data/lib/chewy/query/nodes/and.rb +2 -2
  39. data/lib/chewy/query/nodes/bool.rb +1 -1
  40. data/lib/chewy/query/nodes/equal.rb +2 -2
  41. data/lib/chewy/query/nodes/exists.rb +1 -1
  42. data/lib/chewy/query/nodes/has_relation.rb +2 -2
  43. data/lib/chewy/query/nodes/match_all.rb +1 -1
  44. data/lib/chewy/query/nodes/missing.rb +1 -1
  45. data/lib/chewy/query/nodes/not.rb +2 -2
  46. data/lib/chewy/query/nodes/or.rb +2 -2
  47. data/lib/chewy/query/nodes/prefix.rb +1 -1
  48. data/lib/chewy/query/nodes/query.rb +2 -2
  49. data/lib/chewy/query/nodes/range.rb +4 -4
  50. data/lib/chewy/query/nodes/regexp.rb +4 -4
  51. data/lib/chewy/query/nodes/script.rb +3 -3
  52. data/lib/chewy/query/pagination.rb +10 -1
  53. data/lib/chewy/railtie.rb +1 -0
  54. data/lib/chewy/rake_helper.rb +265 -48
  55. data/lib/chewy/rspec/update_index.rb +30 -22
  56. data/lib/chewy/search.rb +78 -21
  57. data/lib/chewy/search/loader.rb +83 -0
  58. data/lib/chewy/{query → search}/pagination/kaminari.rb +13 -5
  59. data/lib/chewy/search/pagination/will_paginate.rb +41 -0
  60. data/lib/chewy/search/parameters.rb +150 -0
  61. data/lib/chewy/search/parameters/aggs.rb +16 -0
  62. data/lib/chewy/search/parameters/concerns/bool_storage.rb +24 -0
  63. data/lib/chewy/search/parameters/concerns/hash_storage.rb +23 -0
  64. data/lib/chewy/search/parameters/concerns/integer_storage.rb +14 -0
  65. data/lib/chewy/search/parameters/concerns/query_storage.rb +237 -0
  66. data/lib/chewy/search/parameters/concerns/string_array_storage.rb +23 -0
  67. data/lib/chewy/search/parameters/concerns/string_storage.rb +14 -0
  68. data/lib/chewy/search/parameters/docvalue_fields.rb +12 -0
  69. data/lib/chewy/search/parameters/explain.rb +16 -0
  70. data/lib/chewy/search/parameters/filter.rb +47 -0
  71. data/lib/chewy/search/parameters/highlight.rb +16 -0
  72. data/lib/chewy/search/parameters/indices_boost.rb +52 -0
  73. data/lib/chewy/search/parameters/limit.rb +17 -0
  74. data/lib/chewy/search/parameters/load.rb +32 -0
  75. data/lib/chewy/search/parameters/min_score.rb +16 -0
  76. data/lib/chewy/search/parameters/none.rb +27 -0
  77. data/lib/chewy/search/parameters/offset.rb +17 -0
  78. data/lib/chewy/search/parameters/order.rb +64 -0
  79. data/lib/chewy/search/parameters/post_filter.rb +19 -0
  80. data/lib/chewy/search/parameters/preference.rb +16 -0
  81. data/lib/chewy/search/parameters/profile.rb +16 -0
  82. data/lib/chewy/search/parameters/query.rb +19 -0
  83. data/lib/chewy/search/parameters/request_cache.rb +27 -0
  84. data/lib/chewy/search/parameters/rescore.rb +29 -0
  85. data/lib/chewy/search/parameters/script_fields.rb +16 -0
  86. data/lib/chewy/search/parameters/search_after.rb +20 -0
  87. data/lib/chewy/search/parameters/search_type.rb +16 -0
  88. data/lib/chewy/search/parameters/source.rb +73 -0
  89. data/lib/chewy/search/parameters/storage.rb +95 -0
  90. data/lib/chewy/search/parameters/stored_fields.rb +63 -0
  91. data/lib/chewy/search/parameters/suggest.rb +16 -0
  92. data/lib/chewy/search/parameters/terminate_after.rb +16 -0
  93. data/lib/chewy/search/parameters/timeout.rb +16 -0
  94. data/lib/chewy/search/parameters/track_scores.rb +16 -0
  95. data/lib/chewy/search/parameters/types.rb +20 -0
  96. data/lib/chewy/search/parameters/version.rb +16 -0
  97. data/lib/chewy/search/query_proxy.rb +257 -0
  98. data/lib/chewy/search/request.rb +1021 -0
  99. data/lib/chewy/search/response.rb +119 -0
  100. data/lib/chewy/search/scoping.rb +50 -0
  101. data/lib/chewy/search/scrolling.rb +136 -0
  102. data/lib/chewy/stash.rb +70 -0
  103. data/lib/chewy/strategy.rb +10 -3
  104. data/lib/chewy/strategy/active_job.rb +1 -0
  105. data/lib/chewy/strategy/atomic.rb +1 -3
  106. data/lib/chewy/strategy/bypass.rb +1 -1
  107. data/lib/chewy/strategy/resque.rb +1 -0
  108. data/lib/chewy/strategy/shoryuken.rb +40 -0
  109. data/lib/chewy/strategy/sidekiq.rb +13 -3
  110. data/lib/chewy/type.rb +29 -7
  111. data/lib/chewy/type/actions.rb +26 -2
  112. data/lib/chewy/type/adapter/active_record.rb +44 -29
  113. data/lib/chewy/type/adapter/base.rb +27 -7
  114. data/lib/chewy/type/adapter/mongoid.rb +18 -7
  115. data/lib/chewy/type/adapter/object.rb +187 -26
  116. data/lib/chewy/type/adapter/orm.rb +59 -32
  117. data/lib/chewy/type/adapter/sequel.rb +32 -16
  118. data/lib/chewy/type/import.rb +145 -191
  119. data/lib/chewy/type/import/bulk_builder.rb +122 -0
  120. data/lib/chewy/type/import/bulk_request.rb +76 -0
  121. data/lib/chewy/type/import/journal_builder.rb +45 -0
  122. data/lib/chewy/type/import/routine.rb +138 -0
  123. data/lib/chewy/type/mapping.rb +11 -1
  124. data/lib/chewy/type/observe.rb +1 -1
  125. data/lib/chewy/type/syncer.rb +220 -0
  126. data/lib/chewy/type/witchcraft.rb +27 -13
  127. data/lib/chewy/type/wrapper.rb +28 -2
  128. data/lib/chewy/version.rb +1 -1
  129. data/lib/tasks/chewy.rake +84 -26
  130. data/spec/chewy/config_spec.rb +82 -1
  131. data/spec/chewy/fields/base_spec.rb +147 -112
  132. data/spec/chewy/fields/root_spec.rb +75 -18
  133. data/spec/chewy/fields/time_fields_spec.rb +2 -3
  134. data/spec/chewy/index/actions_spec.rb +180 -50
  135. data/spec/chewy/index/aliases_spec.rb +2 -2
  136. data/spec/chewy/index/settings_spec.rb +67 -38
  137. data/spec/chewy/index/specification_spec.rb +160 -0
  138. data/spec/chewy/index_spec.rb +57 -66
  139. data/spec/chewy/journal_spec.rb +149 -54
  140. data/spec/chewy/minitest/helpers_spec.rb +4 -4
  141. data/spec/chewy/minitest/search_index_receiver_spec.rb +1 -1
  142. data/spec/chewy/query/criteria_spec.rb +179 -179
  143. data/spec/chewy/query/filters_spec.rb +15 -15
  144. data/spec/chewy/query/loading_spec.rb +22 -20
  145. data/spec/chewy/query/nodes/and_spec.rb +2 -2
  146. data/spec/chewy/query/nodes/bool_spec.rb +4 -4
  147. data/spec/chewy/query/nodes/equal_spec.rb +19 -19
  148. data/spec/chewy/query/nodes/exists_spec.rb +6 -6
  149. data/spec/chewy/query/nodes/has_child_spec.rb +19 -19
  150. data/spec/chewy/query/nodes/has_parent_spec.rb +19 -19
  151. data/spec/chewy/query/nodes/missing_spec.rb +5 -5
  152. data/spec/chewy/query/nodes/not_spec.rb +3 -2
  153. data/spec/chewy/query/nodes/or_spec.rb +2 -2
  154. data/spec/chewy/query/nodes/prefix_spec.rb +5 -5
  155. data/spec/chewy/query/nodes/query_spec.rb +2 -2
  156. data/spec/chewy/query/nodes/range_spec.rb +18 -18
  157. data/spec/chewy/query/nodes/raw_spec.rb +1 -1
  158. data/spec/chewy/query/nodes/regexp_spec.rb +14 -14
  159. data/spec/chewy/query/nodes/script_spec.rb +4 -4
  160. data/spec/chewy/query/pagination/kaminari_spec.rb +3 -55
  161. data/spec/chewy/query/pagination/will_paginate_spec.rb +5 -0
  162. data/spec/chewy/query/pagination_spec.rb +25 -21
  163. data/spec/chewy/query_spec.rb +501 -560
  164. data/spec/chewy/rake_helper_spec.rb +368 -0
  165. data/spec/chewy/repository_spec.rb +4 -4
  166. data/spec/chewy/rspec/update_index_spec.rb +89 -56
  167. data/spec/chewy/runtime_spec.rb +2 -2
  168. data/spec/chewy/search/loader_spec.rb +117 -0
  169. data/spec/chewy/search/pagination/kaminari_examples.rb +71 -0
  170. data/spec/chewy/search/pagination/kaminari_spec.rb +17 -0
  171. data/spec/chewy/search/pagination/will_paginate_examples.rb +63 -0
  172. data/spec/chewy/search/pagination/will_paginate_spec.rb +17 -0
  173. data/spec/chewy/search/parameters/aggs_spec.rb +5 -0
  174. data/spec/chewy/search/parameters/bool_storage_examples.rb +53 -0
  175. data/spec/chewy/search/parameters/docvalue_fields_spec.rb +5 -0
  176. data/spec/chewy/search/parameters/explain_spec.rb +5 -0
  177. data/spec/chewy/search/parameters/filter_spec.rb +5 -0
  178. data/spec/chewy/search/parameters/hash_storage_examples.rb +59 -0
  179. data/spec/chewy/search/parameters/highlight_spec.rb +5 -0
  180. data/spec/chewy/search/parameters/indices_boost_spec.rb +83 -0
  181. data/spec/chewy/search/parameters/integer_storage_examples.rb +32 -0
  182. data/spec/chewy/search/parameters/limit_spec.rb +5 -0
  183. data/spec/chewy/search/parameters/load_spec.rb +60 -0
  184. data/spec/chewy/search/parameters/min_score_spec.rb +32 -0
  185. data/spec/chewy/search/parameters/none_spec.rb +5 -0
  186. data/spec/chewy/search/parameters/offset_spec.rb +5 -0
  187. data/spec/chewy/search/parameters/order_spec.rb +65 -0
  188. data/spec/chewy/search/parameters/post_filter_spec.rb +5 -0
  189. data/spec/chewy/search/parameters/preference_spec.rb +5 -0
  190. data/spec/chewy/search/parameters/profile_spec.rb +5 -0
  191. data/spec/chewy/search/parameters/query_spec.rb +5 -0
  192. data/spec/chewy/search/parameters/query_storage_examples.rb +388 -0
  193. data/spec/chewy/search/parameters/request_cache_spec.rb +67 -0
  194. data/spec/chewy/search/parameters/rescore_spec.rb +62 -0
  195. data/spec/chewy/search/parameters/script_fields_spec.rb +5 -0
  196. data/spec/chewy/search/parameters/search_after_spec.rb +32 -0
  197. data/spec/chewy/search/parameters/search_type_spec.rb +5 -0
  198. data/spec/chewy/search/parameters/source_spec.rb +156 -0
  199. data/spec/chewy/search/parameters/storage_spec.rb +60 -0
  200. data/spec/chewy/search/parameters/stored_fields_spec.rb +126 -0
  201. data/spec/chewy/search/parameters/string_array_storage_examples.rb +63 -0
  202. data/spec/chewy/search/parameters/string_storage_examples.rb +32 -0
  203. data/spec/chewy/search/parameters/suggest_spec.rb +5 -0
  204. data/spec/chewy/search/parameters/terminate_after_spec.rb +5 -0
  205. data/spec/chewy/search/parameters/timeout_spec.rb +5 -0
  206. data/spec/chewy/search/parameters/track_scores_spec.rb +5 -0
  207. data/spec/chewy/search/parameters/types_spec.rb +5 -0
  208. data/spec/chewy/search/parameters/version_spec.rb +5 -0
  209. data/spec/chewy/search/parameters_spec.rb +130 -0
  210. data/spec/chewy/search/query_proxy_spec.rb +68 -0
  211. data/spec/chewy/search/request_spec.rb +669 -0
  212. data/spec/chewy/search/response_spec.rb +192 -0
  213. data/spec/chewy/search/scrolling_spec.rb +169 -0
  214. data/spec/chewy/search_spec.rb +13 -6
  215. data/spec/chewy/stash_spec.rb +95 -0
  216. data/spec/chewy/strategy/active_job_spec.rb +6 -0
  217. data/spec/chewy/strategy/resque_spec.rb +6 -0
  218. data/spec/chewy/strategy/shoryuken_spec.rb +64 -0
  219. data/spec/chewy/strategy/sidekiq_spec.rb +8 -0
  220. data/spec/chewy/strategy_spec.rb +6 -6
  221. data/spec/chewy/type/actions_spec.rb +29 -10
  222. data/spec/chewy/type/adapter/active_record_spec.rb +203 -91
  223. data/spec/chewy/type/adapter/mongoid_spec.rb +112 -54
  224. data/spec/chewy/type/adapter/object_spec.rb +101 -28
  225. data/spec/chewy/type/adapter/sequel_spec.rb +149 -82
  226. data/spec/chewy/type/import/bulk_builder_spec.rb +279 -0
  227. data/spec/chewy/type/import/bulk_request_spec.rb +102 -0
  228. data/spec/chewy/type/import/journal_builder_spec.rb +95 -0
  229. data/spec/chewy/type/import/routine_spec.rb +110 -0
  230. data/spec/chewy/type/import_spec.rb +350 -271
  231. data/spec/chewy/type/mapping_spec.rb +54 -18
  232. data/spec/chewy/type/observe_spec.rb +5 -1
  233. data/spec/chewy/type/syncer_spec.rb +123 -0
  234. data/spec/chewy/type/witchcraft_spec.rb +45 -29
  235. data/spec/chewy/type/wrapper_spec.rb +63 -23
  236. data/spec/chewy/type_spec.rb +28 -7
  237. data/spec/chewy_spec.rb +75 -7
  238. data/spec/spec_helper.rb +5 -2
  239. data/spec/support/active_record.rb +5 -1
  240. data/spec/support/class_helpers.rb +0 -14
  241. data/spec/support/mongoid.rb +15 -3
  242. data/spec/support/sequel.rb +6 -1
  243. metadata +198 -37
  244. data/gemfiles/rails.3.2.activerecord.gemfile +0 -16
  245. data/gemfiles/rails.3.2.activerecord.kaminari.gemfile +0 -15
  246. data/gemfiles/rails.3.2.activerecord.will_paginate.gemfile +0 -15
  247. data/gemfiles/rails.4.2.activerecord.kaminari.gemfile +0 -16
  248. data/gemfiles/rails.4.2.activerecord.will_paginate.gemfile +0 -16
  249. data/gemfiles/rails.4.2.mongoid.4.0.gemfile +0 -16
  250. data/gemfiles/rails.4.2.mongoid.4.0.kaminari.gemfile +0 -15
  251. data/gemfiles/rails.4.2.mongoid.4.0.will_paginate.gemfile +0 -15
  252. data/gemfiles/rails.4.2.mongoid.5.1.kaminari.gemfile +0 -15
  253. data/gemfiles/rails.4.2.mongoid.5.1.will_paginate.gemfile +0 -15
  254. data/gemfiles/rails.5.0.activerecord.kaminari.gemfile +0 -16
  255. data/gemfiles/rails.5.0.activerecord.will_paginate.gemfile +0 -16
  256. data/gemfiles/sequel.4.38.gemfile +0 -14
  257. data/lib/chewy/journal/apply.rb +0 -31
  258. data/lib/chewy/journal/clean.rb +0 -24
  259. data/lib/chewy/journal/entry.rb +0 -83
  260. data/lib/chewy/journal/query.rb +0 -87
  261. data/lib/chewy/query/pagination/will_paginate.rb +0 -27
  262. data/lib/chewy/query/scoping.rb +0 -20
  263. data/spec/chewy/journal/apply_spec.rb +0 -120
  264. data/spec/chewy/journal/entry_spec.rb +0 -237
  265. data/spec/chewy/query/pagination/will_paginage_spec.rb +0 -59
@@ -0,0 +1,119 @@
1
+ module Chewy
2
+ module Search
3
+ # This class is an ES response hash wrapper.
4
+ #
5
+ # @see https://www.elastic.co/guide/en/elasticsearch/reference/current/_the_search_api.html
6
+ class Response
7
+ # @param body [Hash] response body hash
8
+ # @param loader [Chewy::Search::Loader] loader instance
9
+ def initialize(body, loader, paginator = nil)
10
+ @body = body
11
+ @loader = loader
12
+ @paginator = paginator
13
+ end
14
+
15
+ # Raw response `hits` collection. Returns an empty array if something went wrong.
16
+ #
17
+ # @return [Array<Hash>]
18
+ def hits
19
+ @hits ||= hits_root['hits'] || []
20
+ end
21
+
22
+ # Response `total` field. Returns `0` if something went wrong.
23
+ #
24
+ # @return [Integer]
25
+ def total
26
+ @total ||= hits_root['total'] || 0
27
+ end
28
+
29
+ # Response `max_score` field.
30
+ #
31
+ # @return [Float]
32
+ def max_score
33
+ @max_score ||= hits_root['max_score']
34
+ end
35
+
36
+ # Duration of the request handling in ms according to ES.
37
+ #
38
+ # @return [Integer]
39
+ def took
40
+ @took ||= @body['took']
41
+ end
42
+
43
+ # Has the request timed out?
44
+ #
45
+ # @return [true, false]
46
+ def timed_out?
47
+ @timed_out ||= @body['timed_out']
48
+ end
49
+
50
+ # The `suggest` response part. Returns empty hash if suggests
51
+ # were not requested.
52
+ #
53
+ # @return [Hash]
54
+ def suggest
55
+ @suggest ||= @body['suggest'] || {}
56
+ end
57
+
58
+ # The `aggregations` response part. Returns empty hash if aggregations
59
+ # were not requested.
60
+ #
61
+ # @return [Hash]
62
+ def aggs
63
+ @aggs ||= @body['aggregations'] || {}
64
+ end
65
+ alias_method :aggregations, :aggs
66
+
67
+ # {Chewy::Type} wrappers collection instantiated on top of hits.
68
+ #
69
+ # @return [Array<Chewy::Type>]
70
+ def wrappers
71
+ @wrappers ||= hits.map do |hit|
72
+ @loader.derive_type(hit['_index'], hit['_type']).build(hit)
73
+ end
74
+ end
75
+
76
+ # ORM/ODM objects that were the source for the Chewy import,
77
+ # now loaded from the DB using the hit ids. Uses the options
78
+ # passed to {Chewy::Search::Request#load} for loading.
79
+ #
80
+ # @see Chewy::Search::Request#load
81
+ # @see Chewy::Search::Loader
82
+ # @return [Array<Object>]
83
+ def objects
84
+ @objects ||= begin
85
+ objects = @loader.load(hits)
86
+ if @paginator
87
+ @paginator.call(objects)
88
+ else
89
+ objects
90
+ end
91
+ end
92
+ end
93
+ alias_method :records, :objects
94
+ alias_method :documents, :objects
95
+
96
+ # This method is used in cases when you need to iterate through
97
+ # both of the collections simultaneously.
98
+ #
99
+ # @example
100
+ # scope.each do |wrapper|
101
+ # scope.object_hash[wrapper]
102
+ # end
103
+ # @see #wrappers
104
+ # @see #objects
105
+ # @return [{Chewy::Type => Object}] a hash with wrappers as keys and ORM/ODM objects as values
106
+ def object_hash
107
+ @object_hash ||= wrappers.zip(objects).to_h
108
+ end
109
+ alias_method :record_hash, :object_hash
110
+ alias_method :document_hash, :object_hash
111
+
112
+ private
113
+
114
+ def hits_root
115
+ @body.fetch('hits', {})
116
+ end
117
+ end
118
+ end
119
+ end
@@ -0,0 +1,50 @@
1
+ module Chewy
2
+ module Search
3
+ # This module along with {Chewy::Search} provides an ability to
4
+ # use named scopes.
5
+ #
6
+ # @example
7
+ # class UsersIndex < Chewy::Index
8
+ # def self.by_name(name)
9
+ # query(match: {name: name})
10
+ # end
11
+ #
12
+ # define_type :user do
13
+ # def self.by_age(age)
14
+ # filter(term: {age: age})
15
+ # end
16
+ # end
17
+ # end
18
+ #
19
+ # UsersIndex.limit(10).by_name('Martin')
20
+ # # => <UsersIndex::Query {..., :body=>{:size=>10, :query=>{:match=>{:name=>"Martin"}}}}>
21
+ # UsersIndex::User.limit(10).by_name('Martin').by_age(42)
22
+ # # => <UsersIndex::User::Query {..., :body=>{:size=>10, :query=>{:bool=>{
23
+ # # :must=>{:match=>{:name=>"Martin"}},
24
+ # # :filter=>{:term=>{:age=>42}}}}}}>
25
+ module Scoping
26
+ extend ActiveSupport::Concern
27
+
28
+ module ClassMethods
29
+ # The scopes stack.
30
+ #
31
+ # @return [Array<Chewy::Search::Request>] array of scopes
32
+ def scopes
33
+ Thread.current[:chewy_scopes] ||= []
34
+ end
35
+ end
36
+
37
+ # Wraps any method so that its contents are executed inside the
38
+ # current request scope.
39
+ #
40
+ # @see Chewy::Search::ClassMethods#all
41
+ # @yield executes the block after the current context is put at the top of the scope stack
42
+ def scoping
43
+ self.class.scopes.push(self)
44
+ yield
45
+ ensure
46
+ self.class.scopes.pop
47
+ end
48
+ end
49
+ end
50
+ end
@@ -0,0 +1,136 @@
1
+ module Chewy
2
+ module Search
3
+ # This module contains batch requests DSL via ES scroll API. All the methods
4
+ # are optimized for memory consumption, they are not caching anything, so
5
+ # use them when you need to do some single-run stuff on a huge amount of
6
+ # documents. Don't forget to tune the `scroll` parameter for long-lasting
7
+ # actions.
8
+ # All the scroll methods respect the limit value if provided.
9
+ #
10
+ # @see https://www.elastic.co/guide/en/elasticsearch/reference/current/search-request-scroll.html
11
+ module Scrolling
12
+ # Iterates through the documents of the scope in batches. The `size` query parameter
13
+ # is overridden by the `batch_size`. There are 2 possible use-cases: with a block or without.
14
+ #
15
+ # @param batch_size [Integer] batch size obviously, replaces `size` query parameter
16
+ # @param scroll [String] cursor expiration time
17
+ #
18
+ # @overload scroll_batches(batch_size: 1000, scroll: '1m')
19
+ # @example
20
+ # PlaceIndex.scroll_batches { |batch| batch.each { |hit| p hit['_id'] } }
21
+ # @yieldparam batch [Array<Hash>] block is executed for each batch of hits
22
+ #
23
+ # @overload scroll_batches(batch_size: 1000, scroll: '1m')
24
+ # @example
25
+ # PlaceIndex.scroll_batches.flat_map { |batch| batch.map { |hit| hit['_id'] } }
26
+ # @return [Enumerator] a standard ruby Enumerator
27
+ def scroll_batches(batch_size: Request::DEFAULT_BATCH_SIZE, scroll: Request::DEFAULT_SCROLL)
28
+ return enum_for(:scroll_batches, batch_size: batch_size, scroll: scroll) unless block_given?
29
+
30
+ result = perform(size: batch_size, scroll: scroll)
31
+ total = [raw_limit_value, result.fetch('hits', {}).fetch('total', 0)].compact.min
32
+ last_batch_size = total % batch_size
33
+ fetched = 0
34
+
35
+ loop do
36
+ hits = result.fetch('hits', {}).fetch('hits', [])
37
+ fetched += hits.size
38
+ hits = hits.first(last_batch_size) if last_batch_size != 0 && fetched >= total
39
+ yield(hits) if hits.present?
40
+ break if fetched >= total
41
+ scroll_id = result['_scroll_id']
42
+ result = perform_scroll(scroll: scroll, scroll_id: scroll_id)
43
+ end
44
+ end
45
+
46
+ # @!method scroll_hits(batch_size: 1000, scroll: '1m')
47
+ # Iterates through the documents of the scope in batches. Yields each hit separately.
48
+ #
49
+ # @param batch_size [Integer] batch size obviously, replaces `size` query parameter
50
+ # @param scroll [String] cursor expiration time
51
+ #
52
+ # @overload scroll_hits(batch_size: 1000, scroll: '1m')
53
+ # @example
54
+ # PlaceIndex.scroll_hits { |hit| p hit['_id'] }
55
+ # @yieldparam hit [Hash] block is executed for each hit
56
+ #
57
+ # @overload scroll_hits(batch_size: 1000, scroll: '1m')
58
+ # @example
59
+ # PlaceIndex.scroll_hits.map { |hit| hit['_id'] }
60
+ # @return [Enumerator] a standard ruby Enumerator
61
+ def scroll_hits(**options)
62
+ return enum_for(:scroll_hits, **options) unless block_given?
63
+
64
+ scroll_batches(**options).each do |batch|
65
+ batch.each { |hit| yield hit }
66
+ end
67
+ end
68
+
69
+ # @!method scroll_wrappers(batch_size: 1000, scroll: '1m')
70
+ # Iterates through the documents of the scope in batches. Yields
71
+ # each hit wrapped with {Chewy::Type}.
72
+ #
73
+ # @param batch_size [Integer] batch size obviously, replaces `size` query parameter
74
+ # @param scroll [String] cursor expiration time
75
+ #
76
+ # @overload scroll_wrappers(batch_size: 1000, scroll: '1m')
77
+ # @example
78
+ # PlaceIndex.scroll_wrappers { |object| p object.id }
79
+ # @yieldparam object [Chewy::Type] block is executed for each hit object
80
+ #
81
+ # @overload scroll_wrappers(batch_size: 1000, scroll: '1m')
82
+ # @example
83
+ # PlaceIndex.scroll_wrappers.map { |object| object.id }
84
+ # @return [Enumerator] a standard ruby Enumerator
85
+ def scroll_wrappers(**options)
86
+ return enum_for(:scroll_wrappers, **options) unless block_given?
87
+
88
+ scroll_hits(**options).each do |hit|
89
+ yield loader.derive_type(hit['_index'], hit['_type']).build(hit)
90
+ end
91
+ end
92
+
93
+ # @!method scroll_objects(batch_size: 1000, scroll: '1m')
94
+ # Iterates through the documents of the scope in batches. Performs load
95
+ # operation for each batch and then yields each loaded ORM/ODM object.
96
+ # Uses {Chewy::Search::Request#load} passed options for loading.
97
+ #
98
+ # @note If the record is not found it yields nil instead.
99
+ # @see Chewy::Search::Request#load
100
+ # @see Chewy::Search::Loader
101
+ # @param batch_size [Integer] batch size obviously, replaces `size` query parameter
102
+ # @param scroll [String] cursor expiration time
103
+ #
104
+ # @overload scroll_objects(batch_size: 1000, scroll: '1m')
105
+ # @example
106
+ # PlaceIndex.scroll_objects { |record| p record.id }
107
+ # @yieldparam record [Object] block is executed for each record loaded
108
+ #
109
+ # @overload scroll_objects(batch_size: 1000, scroll: '1m')
110
+ # @example
111
+ # PlaceIndex.scroll_objects.map { |record| record.id }
112
+ # @return [Enumerator] a standard ruby Enumerator
113
+ def scroll_objects(**options)
114
+ return enum_for(:scroll_objects, **options) unless block_given?
115
+
116
+ except(:source, :stored_fields, :script_fields, :docvalue_fields)
117
+ .source(false).scroll_batches(**options).each do |batch|
118
+ loader.load(batch).each { |object| yield object }
119
+ end
120
+ end
121
+ alias_method :scroll_records, :scroll_objects
122
+ alias_method :scroll_documents, :scroll_objects
123
+
124
+ private
125
+
126
+ def perform_scroll(body)
127
+ ActiveSupport::Notifications.instrument 'search_query.chewy',
128
+ request: body, indexes: _indexes, types: _types,
129
+ index: _indexes.one? ? _indexes.first : _indexes,
130
+ type: _types.one? ? _types.first : _types do
131
+ Chewy.client.scroll(body)
132
+ end
133
+ end
134
+ end
135
+ end
136
+ end
@@ -0,0 +1,70 @@
1
+ module Chewy
2
+ # This class is the main storage for Chewy service data.
3
+ # Currently, raw index specifications are stored in the `chewy_stash`
4
+ # index. In the future the journal will be moved here as well.
5
+ #
6
+ # @see Chewy::Index::Specification
7
+ class Stash < Chewy::Index
8
+ index_name 'chewy_stash'
9
+
10
+ define_type :specification do
11
+ default_import_options journal: false
12
+
13
+ field :value, index: 'no'
14
+ end
15
+
16
+ define_type :journal do # rubocop:disable Metrics/BlockLength
17
+ default_import_options journal: false
18
+
19
+ field :index_name, type: 'string', index: 'not_analyzed'
20
+ field :type_name, type: 'string', index: 'not_analyzed'
21
+ field :action, type: 'string', index: 'not_analyzed'
22
+ field :references, type: 'string', index: 'no'
23
+ field :created_at, type: 'date'
24
+
25
+ # Loads all entries since the specified time.
26
+ #
27
+ # @param since_time [Time, DateTime] a timestamp from which we load a journal
28
+ # @param only [Chewy::Index, Array<Chewy::Index>] journal entries related to these indices will be loaded only
29
+ def self.entries(since_time, only: [])
30
+ self.for(only).filter(range: {created_at: {gt: since_time}})
31
+ end
32
+
33
+ # Cleans up all the journal entries until the specified time. If nothing is
34
+ # specified - cleans up everything.
35
+ #
36
+ # @param until_time [Time, DateTime] the upper time boundary
37
+ # @param only [Chewy::Index, Array<Chewy::Index>] indexes to clean up journal entries for
38
+ def self.clean(until_time = nil, only: [])
39
+ scope = self.for(only)
40
+ scope = scope.filter(range: {created_at: {lte: until_time}}) if until_time
41
+ scope.delete_all
42
+ end
43
+
44
+ # Selects all the journal entries for the specified indices.
45
+ #
46
+ # @param something [Chewy::Index, Array<Chewy::Index>] indices to select journal entries for
47
+ def self.for(*something)
48
+ something = something.flatten.compact
49
+ types = something.flat_map { |s| Chewy.derive_types(s) }
50
+ return none if something.present? && types.blank?
51
+ scope = all
52
+ types.group_by(&:index).each do |index, index_types|
53
+ scope = scope.or(
54
+ filter(term: {index_name: index.derivable_name})
55
+ .filter(terms: {type_name: index_types.map(&:type_name)})
56
+ )
57
+ end
58
+ scope
59
+ end
60
+
61
+ def type
62
+ @type ||= Chewy.derive_type("#{index_name}##{type_name}")
63
+ end
64
+
65
+ def references
66
+ @references ||= Array.wrap(@attributes['references']).map { |r| JSON.load(r) } # rubocop:disable Security/JSONLoad
67
+ end
68
+ end
69
+ end
70
+ end
@@ -17,6 +17,13 @@ rescue LoadError
17
17
  nil
18
18
  end
19
19
 
20
+ begin
21
+ require 'shoryuken'
22
+ require 'chewy/strategy/shoryuken'
23
+ rescue LoadError
24
+ nil
25
+ end
26
+
20
27
  begin
21
28
  require 'active_job'
22
29
  require 'chewy/strategy/active_job'
@@ -47,14 +54,14 @@ module Chewy
47
54
 
48
55
  def push(name)
49
56
  result = @stack.push resolve(name).new
50
- debug "[#{@stack.size}] <- #{current.name}"
57
+ debug "[#{@stack.size - 1}] <- #{current.name}" if @stack.size > 2
51
58
  result
52
59
  end
53
60
 
54
61
  def pop
55
62
  raise "Can't pop root strategy" if @stack.one?
56
- debug "[#{@stack.size}] -> #{current.name}"
57
63
  result = @stack.pop.tap(&:leave)
64
+ debug "[#{@stack.size}] -> #{result.name}, now #{current.name}" if @stack.size > 1
58
65
  result
59
66
  end
60
67
 
@@ -70,7 +77,7 @@ module Chewy
70
77
  def debug(string)
71
78
  return unless Chewy.logger && Chewy.logger.debug?
72
79
  line = caller.detect { |l| l !~ %r{lib/chewy/strategy.rb:|lib/chewy.rb:} }
73
- Chewy.logger.debug(["DEBUG: Chewy strategies stack: #{string}", line.sub(/:in\s.+$/, '')].join(' @ '))
80
+ Chewy.logger.debug(["Chewy strategies stack: #{string}", line.sub(/:in\s.+$/, '')].join(' @ '))
74
81
  end
75
82
 
76
83
  def resolve(name)
@@ -14,6 +14,7 @@ module Chewy
14
14
  queue_as :chewy
15
15
 
16
16
  def perform(type, ids, options = {})
17
+ options[:refresh] = !Chewy.disable_refresh_async if Chewy.disable_refresh_async
17
18
  type.constantize.import!(ids, options)
18
19
  end
19
20
  end
@@ -16,9 +16,7 @@ module Chewy
16
16
  @stash = {}
17
17
  end
18
18
 
19
- def update(type, objects, options = {})
20
- ActiveSupport::Deprecation.warn('`urgent: true` option is deprecated and is not effective inside `:atomic` strategy, use `Chewy.strategy(:urgent)` strategy instead') if options.key?(:urgent)
21
-
19
+ def update(type, objects, _options = {})
22
20
  @stash[type] ||= []
23
21
  @stash[type] |= type.send(:build_root).id ? Array.wrap(objects) : type.adapter.identify(objects)
24
22
  end
@@ -8,7 +8,7 @@ module Chewy
8
8
  # end
9
9
  #
10
10
  class Bypass < Base
11
- def update(type, objects, options = {}); end
11
+ def update(type, objects, _options = {}); end
12
12
  end
13
13
  end
14
14
  end