chewy 0.9.0 → 0.10.0
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/.gitignore +1 -0
- data/.rubocop.yml +24 -2
- data/.rubocop_todo.yml +2 -2
- data/.travis.yml +38 -21
- data/.yardopts +5 -0
- data/Appraisals +55 -27
- data/CHANGELOG.md +57 -12
- data/Gemfile +14 -10
- data/LEGACY_DSL.md +497 -0
- data/README.md +249 -515
- data/chewy.gemspec +5 -4
- data/gemfiles/rails.4.0.activerecord.gemfile +14 -0
- data/gemfiles/rails.4.1.activerecord.gemfile +14 -0
- data/gemfiles/rails.4.2.activerecord.gemfile +8 -10
- data/gemfiles/rails.4.2.mongoid.5.1.gemfile +9 -10
- data/gemfiles/rails.5.0.activerecord.gemfile +8 -10
- data/gemfiles/rails.5.0.mongoid.6.0.gemfile +15 -0
- data/gemfiles/rails.5.1.activerecord.gemfile +15 -0
- data/gemfiles/rails.5.1.mongoid.6.1.gemfile +15 -0
- data/gemfiles/sequel.4.45.gemfile +11 -0
- data/lib/chewy.rb +77 -43
- data/lib/chewy/config.rb +44 -7
- data/lib/chewy/errors.rb +2 -2
- data/lib/chewy/fields/base.rb +39 -32
- data/lib/chewy/fields/root.rb +33 -7
- data/lib/chewy/index.rb +237 -149
- data/lib/chewy/index/actions.rb +85 -28
- data/lib/chewy/index/aliases.rb +2 -1
- data/lib/chewy/index/settings.rb +9 -5
- data/lib/chewy/index/specification.rb +58 -0
- data/lib/chewy/journal.rb +40 -92
- data/lib/chewy/query.rb +43 -27
- data/lib/chewy/query/compose.rb +13 -13
- data/lib/chewy/query/criteria.rb +13 -13
- data/lib/chewy/query/filters.rb +1 -1
- data/lib/chewy/query/loading.rb +1 -1
- data/lib/chewy/query/nodes/and.rb +2 -2
- data/lib/chewy/query/nodes/bool.rb +1 -1
- data/lib/chewy/query/nodes/equal.rb +2 -2
- data/lib/chewy/query/nodes/exists.rb +1 -1
- data/lib/chewy/query/nodes/has_relation.rb +2 -2
- data/lib/chewy/query/nodes/match_all.rb +1 -1
- data/lib/chewy/query/nodes/missing.rb +1 -1
- data/lib/chewy/query/nodes/not.rb +2 -2
- data/lib/chewy/query/nodes/or.rb +2 -2
- data/lib/chewy/query/nodes/prefix.rb +1 -1
- data/lib/chewy/query/nodes/query.rb +2 -2
- data/lib/chewy/query/nodes/range.rb +4 -4
- data/lib/chewy/query/nodes/regexp.rb +4 -4
- data/lib/chewy/query/nodes/script.rb +3 -3
- data/lib/chewy/query/pagination.rb +10 -1
- data/lib/chewy/railtie.rb +1 -0
- data/lib/chewy/rake_helper.rb +265 -48
- data/lib/chewy/rspec/update_index.rb +30 -22
- data/lib/chewy/search.rb +78 -21
- data/lib/chewy/search/loader.rb +83 -0
- data/lib/chewy/{query → search}/pagination/kaminari.rb +13 -5
- data/lib/chewy/search/pagination/will_paginate.rb +41 -0
- data/lib/chewy/search/parameters.rb +150 -0
- data/lib/chewy/search/parameters/aggs.rb +16 -0
- data/lib/chewy/search/parameters/concerns/bool_storage.rb +24 -0
- data/lib/chewy/search/parameters/concerns/hash_storage.rb +23 -0
- data/lib/chewy/search/parameters/concerns/integer_storage.rb +14 -0
- data/lib/chewy/search/parameters/concerns/query_storage.rb +237 -0
- data/lib/chewy/search/parameters/concerns/string_array_storage.rb +23 -0
- data/lib/chewy/search/parameters/concerns/string_storage.rb +14 -0
- data/lib/chewy/search/parameters/docvalue_fields.rb +12 -0
- data/lib/chewy/search/parameters/explain.rb +16 -0
- data/lib/chewy/search/parameters/filter.rb +47 -0
- data/lib/chewy/search/parameters/highlight.rb +16 -0
- data/lib/chewy/search/parameters/indices_boost.rb +52 -0
- data/lib/chewy/search/parameters/limit.rb +17 -0
- data/lib/chewy/search/parameters/load.rb +32 -0
- data/lib/chewy/search/parameters/min_score.rb +16 -0
- data/lib/chewy/search/parameters/none.rb +27 -0
- data/lib/chewy/search/parameters/offset.rb +17 -0
- data/lib/chewy/search/parameters/order.rb +64 -0
- data/lib/chewy/search/parameters/post_filter.rb +19 -0
- data/lib/chewy/search/parameters/preference.rb +16 -0
- data/lib/chewy/search/parameters/profile.rb +16 -0
- data/lib/chewy/search/parameters/query.rb +19 -0
- data/lib/chewy/search/parameters/request_cache.rb +27 -0
- data/lib/chewy/search/parameters/rescore.rb +29 -0
- data/lib/chewy/search/parameters/script_fields.rb +16 -0
- data/lib/chewy/search/parameters/search_after.rb +20 -0
- data/lib/chewy/search/parameters/search_type.rb +16 -0
- data/lib/chewy/search/parameters/source.rb +73 -0
- data/lib/chewy/search/parameters/storage.rb +95 -0
- data/lib/chewy/search/parameters/stored_fields.rb +63 -0
- data/lib/chewy/search/parameters/suggest.rb +16 -0
- data/lib/chewy/search/parameters/terminate_after.rb +16 -0
- data/lib/chewy/search/parameters/timeout.rb +16 -0
- data/lib/chewy/search/parameters/track_scores.rb +16 -0
- data/lib/chewy/search/parameters/types.rb +20 -0
- data/lib/chewy/search/parameters/version.rb +16 -0
- data/lib/chewy/search/query_proxy.rb +257 -0
- data/lib/chewy/search/request.rb +1021 -0
- data/lib/chewy/search/response.rb +119 -0
- data/lib/chewy/search/scoping.rb +50 -0
- data/lib/chewy/search/scrolling.rb +136 -0
- data/lib/chewy/stash.rb +70 -0
- data/lib/chewy/strategy.rb +10 -3
- data/lib/chewy/strategy/active_job.rb +1 -0
- data/lib/chewy/strategy/atomic.rb +1 -3
- data/lib/chewy/strategy/bypass.rb +1 -1
- data/lib/chewy/strategy/resque.rb +1 -0
- data/lib/chewy/strategy/shoryuken.rb +40 -0
- data/lib/chewy/strategy/sidekiq.rb +13 -3
- data/lib/chewy/type.rb +29 -7
- data/lib/chewy/type/actions.rb +26 -2
- data/lib/chewy/type/adapter/active_record.rb +44 -29
- data/lib/chewy/type/adapter/base.rb +27 -7
- data/lib/chewy/type/adapter/mongoid.rb +18 -7
- data/lib/chewy/type/adapter/object.rb +187 -26
- data/lib/chewy/type/adapter/orm.rb +59 -32
- data/lib/chewy/type/adapter/sequel.rb +32 -16
- data/lib/chewy/type/import.rb +145 -191
- data/lib/chewy/type/import/bulk_builder.rb +122 -0
- data/lib/chewy/type/import/bulk_request.rb +76 -0
- data/lib/chewy/type/import/journal_builder.rb +45 -0
- data/lib/chewy/type/import/routine.rb +138 -0
- data/lib/chewy/type/mapping.rb +11 -1
- data/lib/chewy/type/observe.rb +1 -1
- data/lib/chewy/type/syncer.rb +220 -0
- data/lib/chewy/type/witchcraft.rb +27 -13
- data/lib/chewy/type/wrapper.rb +28 -2
- data/lib/chewy/version.rb +1 -1
- data/lib/tasks/chewy.rake +84 -26
- data/spec/chewy/config_spec.rb +82 -1
- data/spec/chewy/fields/base_spec.rb +147 -112
- data/spec/chewy/fields/root_spec.rb +75 -18
- data/spec/chewy/fields/time_fields_spec.rb +2 -3
- data/spec/chewy/index/actions_spec.rb +180 -50
- data/spec/chewy/index/aliases_spec.rb +2 -2
- data/spec/chewy/index/settings_spec.rb +67 -38
- data/spec/chewy/index/specification_spec.rb +160 -0
- data/spec/chewy/index_spec.rb +57 -66
- data/spec/chewy/journal_spec.rb +149 -54
- data/spec/chewy/minitest/helpers_spec.rb +4 -4
- data/spec/chewy/minitest/search_index_receiver_spec.rb +1 -1
- data/spec/chewy/query/criteria_spec.rb +179 -179
- data/spec/chewy/query/filters_spec.rb +15 -15
- data/spec/chewy/query/loading_spec.rb +22 -20
- data/spec/chewy/query/nodes/and_spec.rb +2 -2
- data/spec/chewy/query/nodes/bool_spec.rb +4 -4
- data/spec/chewy/query/nodes/equal_spec.rb +19 -19
- data/spec/chewy/query/nodes/exists_spec.rb +6 -6
- data/spec/chewy/query/nodes/has_child_spec.rb +19 -19
- data/spec/chewy/query/nodes/has_parent_spec.rb +19 -19
- data/spec/chewy/query/nodes/missing_spec.rb +5 -5
- data/spec/chewy/query/nodes/not_spec.rb +3 -2
- data/spec/chewy/query/nodes/or_spec.rb +2 -2
- data/spec/chewy/query/nodes/prefix_spec.rb +5 -5
- data/spec/chewy/query/nodes/query_spec.rb +2 -2
- data/spec/chewy/query/nodes/range_spec.rb +18 -18
- data/spec/chewy/query/nodes/raw_spec.rb +1 -1
- data/spec/chewy/query/nodes/regexp_spec.rb +14 -14
- data/spec/chewy/query/nodes/script_spec.rb +4 -4
- data/spec/chewy/query/pagination/kaminari_spec.rb +3 -55
- data/spec/chewy/query/pagination/will_paginate_spec.rb +5 -0
- data/spec/chewy/query/pagination_spec.rb +25 -21
- data/spec/chewy/query_spec.rb +501 -560
- data/spec/chewy/rake_helper_spec.rb +368 -0
- data/spec/chewy/repository_spec.rb +4 -4
- data/spec/chewy/rspec/update_index_spec.rb +89 -56
- data/spec/chewy/runtime_spec.rb +2 -2
- data/spec/chewy/search/loader_spec.rb +117 -0
- data/spec/chewy/search/pagination/kaminari_examples.rb +71 -0
- data/spec/chewy/search/pagination/kaminari_spec.rb +17 -0
- data/spec/chewy/search/pagination/will_paginate_examples.rb +63 -0
- data/spec/chewy/search/pagination/will_paginate_spec.rb +17 -0
- data/spec/chewy/search/parameters/aggs_spec.rb +5 -0
- data/spec/chewy/search/parameters/bool_storage_examples.rb +53 -0
- data/spec/chewy/search/parameters/docvalue_fields_spec.rb +5 -0
- data/spec/chewy/search/parameters/explain_spec.rb +5 -0
- data/spec/chewy/search/parameters/filter_spec.rb +5 -0
- data/spec/chewy/search/parameters/hash_storage_examples.rb +59 -0
- data/spec/chewy/search/parameters/highlight_spec.rb +5 -0
- data/spec/chewy/search/parameters/indices_boost_spec.rb +83 -0
- data/spec/chewy/search/parameters/integer_storage_examples.rb +32 -0
- data/spec/chewy/search/parameters/limit_spec.rb +5 -0
- data/spec/chewy/search/parameters/load_spec.rb +60 -0
- data/spec/chewy/search/parameters/min_score_spec.rb +32 -0
- data/spec/chewy/search/parameters/none_spec.rb +5 -0
- data/spec/chewy/search/parameters/offset_spec.rb +5 -0
- data/spec/chewy/search/parameters/order_spec.rb +65 -0
- data/spec/chewy/search/parameters/post_filter_spec.rb +5 -0
- data/spec/chewy/search/parameters/preference_spec.rb +5 -0
- data/spec/chewy/search/parameters/profile_spec.rb +5 -0
- data/spec/chewy/search/parameters/query_spec.rb +5 -0
- data/spec/chewy/search/parameters/query_storage_examples.rb +388 -0
- data/spec/chewy/search/parameters/request_cache_spec.rb +67 -0
- data/spec/chewy/search/parameters/rescore_spec.rb +62 -0
- data/spec/chewy/search/parameters/script_fields_spec.rb +5 -0
- data/spec/chewy/search/parameters/search_after_spec.rb +32 -0
- data/spec/chewy/search/parameters/search_type_spec.rb +5 -0
- data/spec/chewy/search/parameters/source_spec.rb +156 -0
- data/spec/chewy/search/parameters/storage_spec.rb +60 -0
- data/spec/chewy/search/parameters/stored_fields_spec.rb +126 -0
- data/spec/chewy/search/parameters/string_array_storage_examples.rb +63 -0
- data/spec/chewy/search/parameters/string_storage_examples.rb +32 -0
- data/spec/chewy/search/parameters/suggest_spec.rb +5 -0
- data/spec/chewy/search/parameters/terminate_after_spec.rb +5 -0
- data/spec/chewy/search/parameters/timeout_spec.rb +5 -0
- data/spec/chewy/search/parameters/track_scores_spec.rb +5 -0
- data/spec/chewy/search/parameters/types_spec.rb +5 -0
- data/spec/chewy/search/parameters/version_spec.rb +5 -0
- data/spec/chewy/search/parameters_spec.rb +130 -0
- data/spec/chewy/search/query_proxy_spec.rb +68 -0
- data/spec/chewy/search/request_spec.rb +669 -0
- data/spec/chewy/search/response_spec.rb +192 -0
- data/spec/chewy/search/scrolling_spec.rb +169 -0
- data/spec/chewy/search_spec.rb +13 -6
- data/spec/chewy/stash_spec.rb +95 -0
- data/spec/chewy/strategy/active_job_spec.rb +6 -0
- data/spec/chewy/strategy/resque_spec.rb +6 -0
- data/spec/chewy/strategy/shoryuken_spec.rb +64 -0
- data/spec/chewy/strategy/sidekiq_spec.rb +8 -0
- data/spec/chewy/strategy_spec.rb +6 -6
- data/spec/chewy/type/actions_spec.rb +29 -10
- data/spec/chewy/type/adapter/active_record_spec.rb +203 -91
- data/spec/chewy/type/adapter/mongoid_spec.rb +112 -54
- data/spec/chewy/type/adapter/object_spec.rb +101 -28
- data/spec/chewy/type/adapter/sequel_spec.rb +149 -82
- data/spec/chewy/type/import/bulk_builder_spec.rb +279 -0
- data/spec/chewy/type/import/bulk_request_spec.rb +102 -0
- data/spec/chewy/type/import/journal_builder_spec.rb +95 -0
- data/spec/chewy/type/import/routine_spec.rb +110 -0
- data/spec/chewy/type/import_spec.rb +350 -271
- data/spec/chewy/type/mapping_spec.rb +54 -18
- data/spec/chewy/type/observe_spec.rb +5 -1
- data/spec/chewy/type/syncer_spec.rb +123 -0
- data/spec/chewy/type/witchcraft_spec.rb +45 -29
- data/spec/chewy/type/wrapper_spec.rb +63 -23
- data/spec/chewy/type_spec.rb +28 -7
- data/spec/chewy_spec.rb +75 -7
- data/spec/spec_helper.rb +5 -2
- data/spec/support/active_record.rb +5 -1
- data/spec/support/class_helpers.rb +0 -14
- data/spec/support/mongoid.rb +15 -3
- data/spec/support/sequel.rb +6 -1
- metadata +198 -37
- data/gemfiles/rails.3.2.activerecord.gemfile +0 -16
- data/gemfiles/rails.3.2.activerecord.kaminari.gemfile +0 -15
- data/gemfiles/rails.3.2.activerecord.will_paginate.gemfile +0 -15
- data/gemfiles/rails.4.2.activerecord.kaminari.gemfile +0 -16
- data/gemfiles/rails.4.2.activerecord.will_paginate.gemfile +0 -16
- data/gemfiles/rails.4.2.mongoid.4.0.gemfile +0 -16
- data/gemfiles/rails.4.2.mongoid.4.0.kaminari.gemfile +0 -15
- data/gemfiles/rails.4.2.mongoid.4.0.will_paginate.gemfile +0 -15
- data/gemfiles/rails.4.2.mongoid.5.1.kaminari.gemfile +0 -15
- data/gemfiles/rails.4.2.mongoid.5.1.will_paginate.gemfile +0 -15
- data/gemfiles/rails.5.0.activerecord.kaminari.gemfile +0 -16
- data/gemfiles/rails.5.0.activerecord.will_paginate.gemfile +0 -16
- data/gemfiles/sequel.4.38.gemfile +0 -14
- data/lib/chewy/journal/apply.rb +0 -31
- data/lib/chewy/journal/clean.rb +0 -24
- data/lib/chewy/journal/entry.rb +0 -83
- data/lib/chewy/journal/query.rb +0 -87
- data/lib/chewy/query/pagination/will_paginate.rb +0 -27
- data/lib/chewy/query/scoping.rb +0 -20
- data/spec/chewy/journal/apply_spec.rb +0 -120
- data/spec/chewy/journal/entry_spec.rb +0 -237
- data/spec/chewy/query/pagination/will_paginage_spec.rb +0 -59
@@ -0,0 +1,119 @@
|
|
1
|
+
module Chewy
|
2
|
+
module Search
|
3
|
+
# This class is an ES response hash wrapper.
|
4
|
+
#
|
5
|
+
# @see https://www.elastic.co/guide/en/elasticsearch/reference/current/_the_search_api.html
|
6
|
+
class Response
|
7
|
+
# @param body [Hash] response body hash
|
8
|
+
# @param loader [Chewy::Search::Loader] loader instance
|
9
|
+
def initialize(body, loader, paginator = nil)
|
10
|
+
@body = body
|
11
|
+
@loader = loader
|
12
|
+
@paginator = paginator
|
13
|
+
end
|
14
|
+
|
15
|
+
# Raw response `hits` collection. Returns empty array if something went wrong.
|
16
|
+
#
|
17
|
+
# @return [Array<Hash>]
|
18
|
+
def hits
|
19
|
+
@hits ||= hits_root['hits'] || []
|
20
|
+
end
|
21
|
+
|
22
|
+
# Response `total` field. Returns `0` if something went wrong.
|
23
|
+
#
|
24
|
+
# @return [Integer]
|
25
|
+
def total
|
26
|
+
@total ||= hits_root['total'] || 0
|
27
|
+
end
|
28
|
+
|
29
|
+
# Response `max_score` field.
|
30
|
+
#
|
31
|
+
# @return [Float]
|
32
|
+
def max_score
|
33
|
+
@max_score ||= hits_root['max_score']
|
34
|
+
end
|
35
|
+
|
36
|
+
# Duration of the request handling in ms according to ES.
|
37
|
+
#
|
38
|
+
# @return [Integer]
|
39
|
+
def took
|
40
|
+
@took ||= @body['took']
|
41
|
+
end
|
42
|
+
|
43
|
+
# Has the request been timed out?
|
44
|
+
#
|
45
|
+
# @return [true, false]
|
46
|
+
def timed_out?
|
47
|
+
@timed_out ||= @body['timed_out']
|
48
|
+
end
|
49
|
+
|
50
|
+
# The `suggest` response part. Returns empty hash if suggests
|
51
|
+
# were not requested.
|
52
|
+
#
|
53
|
+
# @return [Hash]
|
54
|
+
def suggest
|
55
|
+
@suggest ||= @body['suggest'] || {}
|
56
|
+
end
|
57
|
+
|
58
|
+
# The `aggregations` response part. Returns empty hash if aggregations
|
59
|
+
# were not requested.
|
60
|
+
#
|
61
|
+
# @return [Hash]
|
62
|
+
def aggs
|
63
|
+
@aggs ||= @body['aggregations'] || {}
|
64
|
+
end
|
65
|
+
alias_method :aggregations, :aggs
|
66
|
+
|
67
|
+
# {Chewy::Type} wrappers collection instantiated on top of hits.
|
68
|
+
#
|
69
|
+
# @return [Array<Chewy::Type>]
|
70
|
+
def wrappers
|
71
|
+
@wrappers ||= hits.map do |hit|
|
72
|
+
@loader.derive_type(hit['_index'], hit['_type']).build(hit)
|
73
|
+
end
|
74
|
+
end
|
75
|
+
|
76
|
+
# ORM/ODM objects that had been a source for Chewy import
|
77
|
+
# and now loaded from the DB using hits ids. Uses
|
78
|
+
# {Chewy::Search::Request#load} passed options for loading.
|
79
|
+
#
|
80
|
+
# @see Chewy::Search::Request#load
|
81
|
+
# @see Chewy::Search::Loader
|
82
|
+
# @return [Array<Object>]
|
83
|
+
def objects
|
84
|
+
@objects ||= begin
|
85
|
+
objects = @loader.load(hits)
|
86
|
+
if @paginator
|
87
|
+
@paginator.call(objects)
|
88
|
+
else
|
89
|
+
objects
|
90
|
+
end
|
91
|
+
end
|
92
|
+
end
|
93
|
+
alias_method :records, :objects
|
94
|
+
alias_method :documents, :objects
|
95
|
+
|
96
|
+
# This method is used in cases when you need to iterate through
|
97
|
+
# both of the collections simultaneously.
|
98
|
+
#
|
99
|
+
# @example
|
100
|
+
# scope.each do |wrapper|
|
101
|
+
# scope.object_hash[wrapper]
|
102
|
+
# end
|
103
|
+
# @see #wrappers
|
104
|
+
# @see #objects
|
105
|
+
# @return [{Chewy::Type => Object}] a hash with wrappers as keys and ORM/ODM objects as values
|
106
|
+
def object_hash
|
107
|
+
@object_hash ||= wrappers.zip(objects).to_h
|
108
|
+
end
|
109
|
+
alias_method :record_hash, :object_hash
|
110
|
+
alias_method :document_hash, :object_hash
|
111
|
+
|
112
|
+
private
|
113
|
+
|
114
|
+
def hits_root
|
115
|
+
@body.fetch('hits', {})
|
116
|
+
end
|
117
|
+
end
|
118
|
+
end
|
119
|
+
end
|
@@ -0,0 +1,50 @@
|
|
1
|
+
module Chewy
|
2
|
+
module Search
|
3
|
+
# This module along with {Chewy::Search} provides an ability to
|
4
|
+
# use named scopes.
|
5
|
+
#
|
6
|
+
# @example
|
7
|
+
# class UsersIndex < Chewy::Index
|
8
|
+
# def self.by_name(name)
|
9
|
+
# query(match: {name: name})
|
10
|
+
# end
|
11
|
+
#
|
12
|
+
# define_type :user do
|
13
|
+
# def self.by_age(age)
|
14
|
+
# filter(term: {age: age})
|
15
|
+
# end
|
16
|
+
# end
|
17
|
+
# end
|
18
|
+
#
|
19
|
+
# UsersIndex.limit(10).by_name('Martin')
|
20
|
+
# # => <UsersIndex::Query {..., :body=>{:size=>10, :query=>{:match=>{:name=>"Martin"}}}}>
|
21
|
+
# UsersIndex::User.limit(10).by_name('Martin').by_age(42)
|
22
|
+
# # => <UsersIndex::User::Query {..., :body=>{:size=>10, :query=>{:bool=>{
|
23
|
+
# # :must=>{:match=>{:name=>"Martin"}},
|
24
|
+
# # :filter=>{:term=>{:age=>42}}}}}}>
|
25
|
+
module Scoping
|
26
|
+
extend ActiveSupport::Concern
|
27
|
+
|
28
|
+
module ClassMethods
|
29
|
+
# The scopes stack.
|
30
|
+
#
|
31
|
+
# @return [Array<Chewy::Search::Request>] array of scopes
|
32
|
+
def scopes
|
33
|
+
Thread.current[:chewy_scopes] ||= []
|
34
|
+
end
|
35
|
+
end
|
36
|
+
|
37
|
+
# Wraps any method to make its contents be executed inside the
|
38
|
+
# current request scope.
|
39
|
+
#
|
40
|
+
# @see Chewy::Search::ClassMethods#all
|
41
|
+
# @yield executes the block after the current context is put at the top of the scope stack
|
42
|
+
def scoping
|
43
|
+
self.class.scopes.push(self)
|
44
|
+
yield
|
45
|
+
ensure
|
46
|
+
self.class.scopes.pop
|
47
|
+
end
|
48
|
+
end
|
49
|
+
end
|
50
|
+
end
|
@@ -0,0 +1,136 @@
|
|
1
|
+
module Chewy
|
2
|
+
module Search
|
3
|
+
# This module contains batch requests DSL via ES scroll API. All the methods
|
4
|
+
# are optimized on memory consumption, they are not caching anything, so
|
5
|
+
# use them when you need to do some single-run stuff on a huge amount of
|
6
|
+
# documents. Don't forget to tune the `scroll` parameter for long-lasting
|
7
|
+
# actions.
|
8
|
+
# All the scroll methods respect the limit value if provided.
|
9
|
+
#
|
10
|
+
# @see https://www.elastic.co/guide/en/elasticsearch/reference/current/search-request-scroll.html
|
11
|
+
module Scrolling
|
12
|
+
# Iterates through the documents of the scope in batches. Limit is overridden
|
13
|
+
# by the `batch_size`. There are 2 possible use-cases: with a block or without.
|
14
|
+
#
|
15
|
+
# @param batch_size [Integer] batch size obviously, replaces `size` query parameter
|
16
|
+
# @param scroll [String] cursor expiration time
|
17
|
+
#
|
18
|
+
# @overload scroll_batches(batch_size: 1000, scroll: '1m')
|
19
|
+
# @example
|
20
|
+
# PlaceIndex.scroll_batches { |batch| batch.each { |hit| p hit['_id'] } }
|
21
|
+
# @yieldparam batch [Array<Hash>] block is executed for each batch of hits
|
22
|
+
#
|
23
|
+
# @overload scroll_batches(batch_size: 1000, scroll: '1m')
|
24
|
+
# @example
|
25
|
+
# PlaceIndex.scroll_batches.flat_map { |batch| batch.map { |hit| hit['_id'] } }
|
26
|
+
# @return [Enumerator] a standard ruby Enumerator
|
27
|
+
def scroll_batches(batch_size: Request::DEFAULT_BATCH_SIZE, scroll: Request::DEFAULT_SCROLL)
|
28
|
+
return enum_for(:scroll_batches, batch_size: batch_size, scroll: scroll) unless block_given?
|
29
|
+
|
30
|
+
result = perform(size: batch_size, scroll: scroll)
|
31
|
+
total = [raw_limit_value, result.fetch('hits', {}).fetch('total', 0)].compact.min
|
32
|
+
last_batch_size = total % batch_size
|
33
|
+
fetched = 0
|
34
|
+
|
35
|
+
loop do
|
36
|
+
hits = result.fetch('hits', {}).fetch('hits', [])
|
37
|
+
fetched += hits.size
|
38
|
+
hits = hits.first(last_batch_size) if last_batch_size != 0 && fetched >= total
|
39
|
+
yield(hits) if hits.present?
|
40
|
+
break if fetched >= total
|
41
|
+
scroll_id = result['_scroll_id']
|
42
|
+
result = perform_scroll(scroll: scroll, scroll_id: scroll_id)
|
43
|
+
end
|
44
|
+
end
|
45
|
+
|
46
|
+
# @!method scroll_hits(batch_size: 1000, scroll: '1m')
|
47
|
+
# Iterates through the documents of the scope in batches. Yields each hit separately.
|
48
|
+
#
|
49
|
+
# @param batch_size [Integer] batch size obviously, replaces `size` query parameter
|
50
|
+
# @param scroll [String] cursor expiration time
|
51
|
+
#
|
52
|
+
# @overload scroll_hits(batch_size: 1000, scroll: '1m')
|
53
|
+
# @example
|
54
|
+
# PlaceIndex.scroll_hits { |hit| p hit['_id'] }
|
55
|
+
# @yieldparam hit [Hash] block is executed for each hit
|
56
|
+
#
|
57
|
+
# @overload scroll_hits(batch_size: 1000, scroll: '1m')
|
58
|
+
# @example
|
59
|
+
# PlaceIndex.scroll_hits.map { |hit| hit['_id'] }
|
60
|
+
# @return [Enumerator] a standard ruby Enumerator
|
61
|
+
def scroll_hits(**options)
|
62
|
+
return enum_for(:scroll_hits, **options) unless block_given?
|
63
|
+
|
64
|
+
scroll_batches(**options).each do |batch|
|
65
|
+
batch.each { |hit| yield hit }
|
66
|
+
end
|
67
|
+
end
|
68
|
+
|
69
|
+
# @!method scroll_wrappers(batch_size: 1000, scroll: '1m')
|
70
|
+
# Iterates through the documents of the scope in batches. Yields
|
71
|
+
# each hit wrapped with {Chewy::Type}.
|
72
|
+
#
|
73
|
+
# @param batch_size [Integer] batch size obviously, replaces `size` query parameter
|
74
|
+
# @param scroll [String] cursor expiration time
|
75
|
+
#
|
76
|
+
# @overload scroll_wrappers(batch_size: 1000, scroll: '1m')
|
77
|
+
# @example
|
78
|
+
# PlaceIndex.scroll_wrappers { |object| p object.id }
|
79
|
+
# @yieldparam object [Chewy::Type] block is executed for each hit object
|
80
|
+
#
|
81
|
+
# @overload scroll_wrappers(batch_size: 1000, scroll: '1m')
|
82
|
+
# @example
|
83
|
+
# PlaceIndex.scroll_wrappers.map { |object| object.id }
|
84
|
+
# @return [Enumerator] a standard ruby Enumerator
|
85
|
+
def scroll_wrappers(**options)
|
86
|
+
return enum_for(:scroll_wrappers, **options) unless block_given?
|
87
|
+
|
88
|
+
scroll_hits(**options).each do |hit|
|
89
|
+
yield loader.derive_type(hit['_index'], hit['_type']).build(hit)
|
90
|
+
end
|
91
|
+
end
|
92
|
+
|
93
|
+
# @!method scroll_objects(batch_size: 1000, scroll: '1m')
|
94
|
+
# Iterates through the documents of the scope in batches. Performs load
|
95
|
+
# operation for each batch and then yields each loaded ORM/ODM object.
|
96
|
+
# Uses {Chewy::Search::Request#load} passed options for loading.
|
97
|
+
#
|
98
|
+
# @note If the record is not found it yields nil instead.
|
99
|
+
# @see Chewy::Search::Request#load
|
100
|
+
# @see Chewy::Search::Loader
|
101
|
+
# @param batch_size [Integer] batch size obviously, replaces `size` query parameter
|
102
|
+
# @param scroll [String] cursor expiration time
|
103
|
+
#
|
104
|
+
# @overload scroll_objects(batch_size: 1000, scroll: '1m')
|
105
|
+
# @example
|
106
|
+
# PlaceIndex.scroll_objects { |record| p record.id }
|
107
|
+
# @yieldparam record [Object] block is executed for each record loaded
|
108
|
+
#
|
109
|
+
# @overload scroll_objects(batch_size: 1000, scroll: '1m')
|
110
|
+
# @example
|
111
|
+
# PlaceIndex.scroll_objects.map { |record| record.id }
|
112
|
+
# @return [Enumerator] a standard ruby Enumerator
|
113
|
+
def scroll_objects(**options)
|
114
|
+
return enum_for(:scroll_objects, **options) unless block_given?
|
115
|
+
|
116
|
+
except(:source, :stored_fields, :script_fields, :docvalue_fields)
|
117
|
+
.source(false).scroll_batches(**options).each do |batch|
|
118
|
+
loader.load(batch).each { |object| yield object }
|
119
|
+
end
|
120
|
+
end
|
121
|
+
alias_method :scroll_records, :scroll_objects
|
122
|
+
alias_method :scroll_documents, :scroll_objects
|
123
|
+
|
124
|
+
private
|
125
|
+
|
126
|
+
def perform_scroll(body)
|
127
|
+
ActiveSupport::Notifications.instrument 'search_query.chewy',
|
128
|
+
request: body, indexes: _indexes, types: _types,
|
129
|
+
index: _indexes.one? ? _indexes.first : _indexes,
|
130
|
+
type: _types.one? ? _types.first : _types do
|
131
|
+
Chewy.client.scroll(body)
|
132
|
+
end
|
133
|
+
end
|
134
|
+
end
|
135
|
+
end
|
136
|
+
end
|
data/lib/chewy/stash.rb
ADDED
@@ -0,0 +1,70 @@
|
|
1
|
+
module Chewy
|
2
|
+
# This class is the main storage for Chewy service data.
|
3
|
+
# Now index raw specifications are stored in the `chewy_stash`
|
4
|
+
# index. In the future the journal will be moved here as well.
|
5
|
+
#
|
6
|
+
# @see Chewy::Index::Specification
|
7
|
+
class Stash < Chewy::Index
|
8
|
+
index_name 'chewy_stash'
|
9
|
+
|
10
|
+
define_type :specification do
|
11
|
+
default_import_options journal: false
|
12
|
+
|
13
|
+
field :value, index: 'no'
|
14
|
+
end
|
15
|
+
|
16
|
+
define_type :journal do # rubocop:disable Metrics/BlockLength
|
17
|
+
default_import_options journal: false
|
18
|
+
|
19
|
+
field :index_name, type: 'string', index: 'not_analyzed'
|
20
|
+
field :type_name, type: 'string', index: 'not_analyzed'
|
21
|
+
field :action, type: 'string', index: 'not_analyzed'
|
22
|
+
field :references, type: 'string', index: 'no'
|
23
|
+
field :created_at, type: 'date'
|
24
|
+
|
25
|
+
# Loads all entries since the specified time.
|
26
|
+
#
|
27
|
+
# @param since_time [Time, DateTime] a timestamp from which we load a journal
|
28
|
+
# @param only [Chewy::Index, Array<Chewy::Index>] journal entries related to these indices will be loaded only
|
29
|
+
def self.entries(since_time, only: [])
|
30
|
+
self.for(only).filter(range: {created_at: {gt: since_time}})
|
31
|
+
end
|
32
|
+
|
33
|
+
# Cleans up all the journal entries until the specified time. If nothing is
|
34
|
+
# specified - cleans up everything.
|
35
|
+
#
|
36
|
+
# @param until_time [Time, DateTime] the time top boundary
|
37
|
+
# @param only [Chewy::Index, Array<Chewy::Index>] indexes to clean up journal entries for
|
38
|
+
def self.clean(until_time = nil, only: [])
|
39
|
+
scope = self.for(only)
|
40
|
+
scope = scope.filter(range: {created_at: {lte: until_time}}) if until_time
|
41
|
+
scope.delete_all
|
42
|
+
end
|
43
|
+
|
44
|
+
# Selects all the journal entries for the specified indices.
|
45
|
+
#
|
46
|
+
# @param something [Chewy::Index, Array<Chewy::Index>] indices to select journal entries for
|
47
|
+
def self.for(*something)
|
48
|
+
something = something.flatten.compact
|
49
|
+
types = something.flat_map { |s| Chewy.derive_types(s) }
|
50
|
+
return none if something.present? && types.blank?
|
51
|
+
scope = all
|
52
|
+
types.group_by(&:index).each do |index, index_types|
|
53
|
+
scope = scope.or(
|
54
|
+
filter(term: {index_name: index.derivable_name})
|
55
|
+
.filter(terms: {type_name: index_types.map(&:type_name)})
|
56
|
+
)
|
57
|
+
end
|
58
|
+
scope
|
59
|
+
end
|
60
|
+
|
61
|
+
def type
|
62
|
+
@type ||= Chewy.derive_type("#{index_name}##{type_name}")
|
63
|
+
end
|
64
|
+
|
65
|
+
def references
|
66
|
+
@references ||= Array.wrap(@attributes['references']).map { |r| JSON.load(r) } # rubocop:disable Security/JSONLoad
|
67
|
+
end
|
68
|
+
end
|
69
|
+
end
|
70
|
+
end
|
data/lib/chewy/strategy.rb
CHANGED
@@ -17,6 +17,13 @@ rescue LoadError
|
|
17
17
|
nil
|
18
18
|
end
|
19
19
|
|
20
|
+
begin
|
21
|
+
require 'shoryuken'
|
22
|
+
require 'chewy/strategy/shoryuken'
|
23
|
+
rescue LoadError
|
24
|
+
nil
|
25
|
+
end
|
26
|
+
|
20
27
|
begin
|
21
28
|
require 'active_job'
|
22
29
|
require 'chewy/strategy/active_job'
|
@@ -47,14 +54,14 @@ module Chewy
|
|
47
54
|
|
48
55
|
def push(name)
|
49
56
|
result = @stack.push resolve(name).new
|
50
|
-
debug "[#{@stack.size}] <- #{current.name}"
|
57
|
+
debug "[#{@stack.size - 1}] <- #{current.name}" if @stack.size > 2
|
51
58
|
result
|
52
59
|
end
|
53
60
|
|
54
61
|
def pop
|
55
62
|
raise "Can't pop root strategy" if @stack.one?
|
56
|
-
debug "[#{@stack.size}] -> #{current.name}"
|
57
63
|
result = @stack.pop.tap(&:leave)
|
64
|
+
debug "[#{@stack.size}] -> #{result.name}, now #{current.name}" if @stack.size > 1
|
58
65
|
result
|
59
66
|
end
|
60
67
|
|
@@ -70,7 +77,7 @@ module Chewy
|
|
70
77
|
def debug(string)
|
71
78
|
return unless Chewy.logger && Chewy.logger.debug?
|
72
79
|
line = caller.detect { |l| l !~ %r{lib/chewy/strategy.rb:|lib/chewy.rb:} }
|
73
|
-
Chewy.logger.debug(["
|
80
|
+
Chewy.logger.debug(["Chewy strategies stack: #{string}", line.sub(/:in\s.+$/, '')].join(' @ '))
|
74
81
|
end
|
75
82
|
|
76
83
|
def resolve(name)
|
@@ -16,9 +16,7 @@ module Chewy
|
|
16
16
|
@stash = {}
|
17
17
|
end
|
18
18
|
|
19
|
-
def update(type, objects,
|
20
|
-
ActiveSupport::Deprecation.warn('`urgent: true` option is deprecated and is not effective inside `:atomic` strategy, use `Chewy.strategy(:urgent)` strategy instead') if options.key?(:urgent)
|
21
|
-
|
19
|
+
def update(type, objects, _options = {})
|
22
20
|
@stash[type] ||= []
|
23
21
|
@stash[type] |= type.send(:build_root).id ? Array.wrap(objects) : type.adapter.identify(objects)
|
24
22
|
end
|