source_monitor 0.2.0 → 0.3.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/.claude/agents/rails-concern.md +464 -0
- data/.claude/agents/rails-controller.md +424 -0
- data/.claude/agents/rails-hotwire.md +446 -0
- data/.claude/agents/rails-implement.md +374 -0
- data/.claude/agents/rails-job.md +334 -0
- data/.claude/agents/rails-lint.md +294 -0
- data/.claude/agents/rails-mailer.md +371 -0
- data/.claude/agents/rails-migration.md +449 -0
- data/.claude/agents/rails-model.md +420 -0
- data/.claude/agents/rails-policy.md +443 -0
- data/.claude/agents/rails-presenter.md +427 -0
- data/.claude/agents/rails-query.md +412 -0
- data/.claude/agents/rails-review.md +490 -0
- data/.claude/agents/rails-service.md +458 -0
- data/.claude/agents/rails-state-records.md +465 -0
- data/.claude/agents/rails-tdd.md +314 -0
- data/.claude/agents/rails-test.md +441 -0
- data/.claude/agents/rails-view-component.md +418 -0
- data/.claude/hooks/block-secrets.sh +52 -0
- data/.claude/settings.json +85 -0
- data/.claude/skills/action-cable-patterns/SKILL.md +296 -0
- data/.claude/skills/action-mailer-patterns/SKILL.md +295 -0
- data/.claude/skills/active-storage-setup/SKILL.md +311 -0
- data/.claude/skills/api-versioning/SKILL.md +294 -0
- data/.claude/skills/authentication-flow/SKILL.md +335 -0
- data/.claude/skills/authentication-flow/reference/current.md +248 -0
- data/.claude/skills/authentication-flow/reference/passwordless.md +253 -0
- data/.claude/skills/authentication-flow/reference/sessions.md +201 -0
- data/.claude/skills/authorization-pundit/SKILL.md +462 -0
- data/.claude/skills/caching-strategies/SKILL.md +350 -0
- data/.claude/skills/database-migrations/SKILL.md +354 -0
- data/.claude/skills/form-object-patterns/SKILL.md +399 -0
- data/.claude/skills/hotwire-patterns/SKILL.md +247 -0
- data/.claude/skills/hotwire-patterns/reference/stimulus.md +307 -0
- data/.claude/skills/hotwire-patterns/reference/tailwind-integration.md +112 -0
- data/.claude/skills/hotwire-patterns/reference/turbo-frames.md +158 -0
- data/.claude/skills/hotwire-patterns/reference/turbo-streams.md +218 -0
- data/.claude/skills/i18n-patterns/SKILL.md +320 -0
- data/.claude/skills/install/SKILL.md +367 -0
- data/.claude/skills/performance-optimization/SKILL.md +311 -0
- data/.claude/skills/rails-architecture/SKILL.md +259 -0
- data/.claude/skills/rails-architecture/reference/error-handling.md +333 -0
- data/.claude/skills/rails-architecture/reference/event-tracking.md +142 -0
- data/.claude/skills/rails-architecture/reference/layer-interactions.md +417 -0
- data/.claude/skills/rails-architecture/reference/multi-tenancy.md +152 -0
- data/.claude/skills/rails-architecture/reference/query-patterns.md +342 -0
- data/.claude/skills/rails-architecture/reference/service-patterns.md +286 -0
- data/.claude/skills/rails-architecture/reference/state-records.md +250 -0
- data/.claude/skills/rails-architecture/reference/testing-strategy.md +326 -0
- data/.claude/skills/rails-concern/SKILL.md +399 -0
- data/.claude/skills/rails-controller/SKILL.md +336 -0
- data/.claude/skills/rails-model-generator/SKILL.md +321 -0
- data/.claude/skills/rails-model-generator/reference/validations.md +298 -0
- data/.claude/skills/rails-presenter/SKILL.md +274 -0
- data/.claude/skills/rails-query-object/SKILL.md +289 -0
- data/.claude/skills/rails-service-object/SKILL.md +349 -0
- data/.claude/skills/solid-queue-setup/SKILL.md +307 -0
- data/.claude/skills/tdd-cycle/SKILL.md +359 -0
- data/.claude/skills/viewcomponent-patterns/SKILL.md +333 -0
- data/.gitignore +1 -0
- data/.rubocop.yml +2 -0
- data/.ruby-version +1 -1
- data/.vbw-planning/.notification-log.jsonl +192 -0
- data/.vbw-planning/.session-log.jsonl +871 -0
- data/.vbw-planning/PROJECT.md +51 -0
- data/.vbw-planning/REQUIREMENTS.md +50 -0
- data/.vbw-planning/SHIPPED.md +28 -0
- data/.vbw-planning/codebase/ARCHITECTURE.md +147 -0
- data/.vbw-planning/codebase/CONCERNS.md +99 -0
- data/.vbw-planning/codebase/CONVENTIONS.md +97 -0
- data/.vbw-planning/codebase/DEPENDENCIES.md +100 -0
- data/.vbw-planning/codebase/INDEX.md +86 -0
- data/.vbw-planning/codebase/META.md +42 -0
- data/.vbw-planning/codebase/PATTERNS.md +262 -0
- data/.vbw-planning/codebase/STACK.md +101 -0
- data/.vbw-planning/codebase/STRUCTURE.md +324 -0
- data/.vbw-planning/codebase/TESTING.md +154 -0
- data/.vbw-planning/config.json +12 -0
- data/.vbw-planning/discovery.json +24 -0
- data/.vbw-planning/milestones/default/ROADMAP.md +115 -0
- data/.vbw-planning/milestones/default/STATE.md +83 -0
- data/.vbw-planning/milestones/default/phases/01-coverage-analysis-quick-wins/PLAN-01-SUMMARY.md +56 -0
- data/.vbw-planning/milestones/default/phases/01-coverage-analysis-quick-wins/PLAN-01.md +187 -0
- data/.vbw-planning/milestones/default/phases/01-coverage-analysis-quick-wins/PLAN-02-SUMMARY.md +64 -0
- data/.vbw-planning/milestones/default/phases/01-coverage-analysis-quick-wins/PLAN-02.md +137 -0
- data/.vbw-planning/milestones/default/phases/02-critical-path-test-coverage/PLAN-01-SUMMARY.md +67 -0
- data/.vbw-planning/milestones/default/phases/02-critical-path-test-coverage/PLAN-01.md +142 -0
- data/.vbw-planning/milestones/default/phases/02-critical-path-test-coverage/PLAN-02-SUMMARY.md +64 -0
- data/.vbw-planning/milestones/default/phases/02-critical-path-test-coverage/PLAN-02.md +138 -0
- data/.vbw-planning/milestones/default/phases/02-critical-path-test-coverage/PLAN-03-SUMMARY.md +85 -0
- data/.vbw-planning/milestones/default/phases/02-critical-path-test-coverage/PLAN-03.md +147 -0
- data/.vbw-planning/milestones/default/phases/02-critical-path-test-coverage/PLAN-04-SUMMARY.md +63 -0
- data/.vbw-planning/milestones/default/phases/02-critical-path-test-coverage/PLAN-04.md +129 -0
- data/.vbw-planning/milestones/default/phases/02-critical-path-test-coverage/PLAN-05-SUMMARY.md +74 -0
- data/.vbw-planning/milestones/default/phases/02-critical-path-test-coverage/PLAN-05.md +154 -0
- data/.vbw-planning/milestones/default/phases/03-large-file-refactoring/03-VERIFICATION-wave1.md +303 -0
- data/.vbw-planning/milestones/default/phases/03-large-file-refactoring/03-VERIFICATION.md +510 -0
- data/.vbw-planning/milestones/default/phases/03-large-file-refactoring/PLAN-01-SUMMARY.md +61 -0
- data/.vbw-planning/milestones/default/phases/03-large-file-refactoring/PLAN-01.md +161 -0
- data/.vbw-planning/milestones/default/phases/03-large-file-refactoring/PLAN-02-SUMMARY.md +66 -0
- data/.vbw-planning/milestones/default/phases/03-large-file-refactoring/PLAN-02.md +132 -0
- data/.vbw-planning/milestones/default/phases/03-large-file-refactoring/PLAN-03-SUMMARY.md +59 -0
- data/.vbw-planning/milestones/default/phases/03-large-file-refactoring/PLAN-03.md +171 -0
- data/.vbw-planning/milestones/default/phases/03-large-file-refactoring/PLAN-04-SUMMARY.md +56 -0
- data/.vbw-planning/milestones/default/phases/03-large-file-refactoring/PLAN-04.md +152 -0
- data/.vbw-planning/milestones/default/phases/04-code-quality-conventions-cleanup/04-CONTEXT.md +33 -0
- data/.vbw-planning/milestones/default/phases/04-code-quality-conventions-cleanup/PLAN-01-SUMMARY.md +42 -0
- data/.vbw-planning/milestones/default/phases/04-code-quality-conventions-cleanup/PLAN-01.md +119 -0
- data/.vbw-planning/milestones/default/phases/04-code-quality-conventions-cleanup/PLAN-02-SUMMARY.md +52 -0
- data/.vbw-planning/milestones/default/phases/04-code-quality-conventions-cleanup/PLAN-02.md +195 -0
- data/.vbw-planning/milestones/default/phases/04-code-quality-conventions-cleanup/PLAN-03-SUMMARY.md +79 -0
- data/.vbw-planning/milestones/default/phases/04-code-quality-conventions-cleanup/PLAN-03.md +130 -0
- data/CHANGELOG.md +28 -0
- data/CLAUDE.md +179 -0
- data/Gemfile +8 -0
- data/Gemfile.lock +114 -101
- data/Rakefile +2 -0
- data/app/assets/builds/source_monitor/application.css +2076 -0
- data/app/assets/builds/source_monitor/application.js +2758 -0
- data/app/assets/builds/source_monitor/application.js.map +7 -0
- data/app/controllers/source_monitor/application_controller.rb +2 -0
- data/app/controllers/source_monitor/health_controller.rb +2 -0
- data/app/controllers/source_monitor/import_sessions/bulk_configuration.rb +106 -0
- data/app/controllers/source_monitor/import_sessions/entry_annotation.rb +187 -0
- data/app/controllers/source_monitor/import_sessions/health_check_management.rb +112 -0
- data/app/controllers/source_monitor/import_sessions/opml_parser.rb +130 -0
- data/app/controllers/source_monitor/import_sessions_controller.rb +6 -507
- data/app/controllers/source_monitor/items_controller.rb +2 -0
- data/app/controllers/source_monitor/sources_controller.rb +0 -14
- data/app/helpers/source_monitor/application_helper.rb +4 -112
- data/app/helpers/source_monitor/health_badge_helper.rb +69 -0
- data/app/helpers/source_monitor/table_sort_helper.rb +53 -0
- data/app/jobs/source_monitor/application_job.rb +2 -0
- data/app/models/source_monitor/application_record.rb +2 -0
- data/app/models/source_monitor/log_entry.rb +0 -2
- data/config/coverage_baseline.json +217 -1862
- data/config/routes.rb +2 -0
- data/db/migrate/20251009103000_add_feed_content_readability_to_sources.rb +2 -0
- data/db/migrate/20251014171659_add_performance_indexes.rb +2 -0
- data/db/migrate/20251014172525_add_fetch_status_check_constraint.rb +2 -0
- data/db/migrate/20251108120116_refresh_fetch_status_constraint.rb +2 -0
- data/db/migrate/20260210204022_add_composite_index_to_log_entries.rb +17 -0
- data/lib/source_monitor/assets/bundler.rb +2 -0
- data/lib/source_monitor/assets.rb +2 -0
- data/lib/source_monitor/configuration/authentication_settings.rb +62 -0
- data/lib/source_monitor/configuration/events.rb +60 -0
- data/lib/source_monitor/configuration/fetching_settings.rb +27 -0
- data/lib/source_monitor/configuration/health_settings.rb +27 -0
- data/lib/source_monitor/configuration/http_settings.rb +43 -0
- data/lib/source_monitor/configuration/model_definition.rb +108 -0
- data/lib/source_monitor/configuration/models.rb +36 -0
- data/lib/source_monitor/configuration/realtime_settings.rb +95 -0
- data/lib/source_monitor/configuration/retention_settings.rb +45 -0
- data/lib/source_monitor/configuration/scraper_registry.rb +67 -0
- data/lib/source_monitor/configuration/scraping_settings.rb +39 -0
- data/lib/source_monitor/configuration/validation_definition.rb +32 -0
- data/lib/source_monitor/configuration.rb +12 -579
- data/lib/source_monitor/dashboard/queries/recent_activity_query.rb +138 -0
- data/lib/source_monitor/dashboard/queries/stats_query.rb +71 -0
- data/lib/source_monitor/dashboard/queries.rb +2 -195
- data/lib/source_monitor/engine.rb +2 -0
- data/lib/source_monitor/fetching/feed_fetcher/adaptive_interval.rb +141 -0
- data/lib/source_monitor/fetching/feed_fetcher/entry_processor.rb +89 -0
- data/lib/source_monitor/fetching/feed_fetcher/source_updater.rb +200 -0
- data/lib/source_monitor/fetching/feed_fetcher.rb +37 -379
- data/lib/source_monitor/items/item_creator/content_extractor.rb +113 -0
- data/lib/source_monitor/items/item_creator/entry_parser/media_extraction.rb +96 -0
- data/lib/source_monitor/items/item_creator/entry_parser.rb +294 -0
- data/lib/source_monitor/items/item_creator.rb +28 -455
- data/lib/source_monitor/setup/bundle_installer.rb +2 -0
- data/lib/source_monitor/setup/cli.rb +2 -0
- data/lib/source_monitor/setup/dependency_checker.rb +2 -0
- data/lib/source_monitor/setup/detectors.rb +2 -0
- data/lib/source_monitor/setup/gemfile_editor.rb +2 -0
- data/lib/source_monitor/setup/initializer_patcher.rb +2 -0
- data/lib/source_monitor/setup/install_generator.rb +2 -0
- data/lib/source_monitor/setup/migration_installer.rb +2 -0
- data/lib/source_monitor/setup/node_installer.rb +2 -0
- data/lib/source_monitor/setup/prompter.rb +2 -0
- data/lib/source_monitor/setup/requirements.rb +2 -0
- data/lib/source_monitor/setup/shell_runner.rb +2 -0
- data/lib/source_monitor/setup/verification/action_cable_verifier.rb +2 -0
- data/lib/source_monitor/setup/verification/printer.rb +2 -0
- data/lib/source_monitor/setup/verification/result.rb +2 -0
- data/lib/source_monitor/setup/verification/runner.rb +2 -0
- data/lib/source_monitor/setup/verification/solid_queue_verifier.rb +2 -0
- data/lib/source_monitor/setup/verification/telemetry_logger.rb +2 -0
- data/lib/source_monitor/setup/workflow.rb +2 -0
- data/lib/source_monitor/version.rb +3 -1
- data/lib/source_monitor.rb +140 -58
- data/lib/tasks/source_monitor_assets.rake +2 -0
- data/lib/tasks/source_monitor_setup.rake +2 -0
- data/lib/tasks/source_monitor_tasks.rake +2 -0
- data/source_monitor.gemspec +3 -1
- metadata +144 -4
|
@@ -0,0 +1,32 @@
|
|
|
1
|
+
# frozen_string_literal: true
|
|
2
|
+
|
|
3
|
+
module SourceMonitor
|
|
4
|
+
class Configuration
|
|
5
|
+
class ValidationDefinition
|
|
6
|
+
attr_reader :handler, :options
|
|
7
|
+
|
|
8
|
+
def initialize(handler, options)
|
|
9
|
+
@handler = handler
|
|
10
|
+
@options = options
|
|
11
|
+
end
|
|
12
|
+
|
|
13
|
+
def signature
|
|
14
|
+
handler_key =
|
|
15
|
+
case handler
|
|
16
|
+
when Symbol
|
|
17
|
+
[ :symbol, handler ]
|
|
18
|
+
when String
|
|
19
|
+
[ :symbol, handler.to_sym ]
|
|
20
|
+
else
|
|
21
|
+
[ :callable, handler.object_id ]
|
|
22
|
+
end
|
|
23
|
+
|
|
24
|
+
[ handler_key, options ]
|
|
25
|
+
end
|
|
26
|
+
|
|
27
|
+
def symbol?
|
|
28
|
+
handler.is_a?(Symbol) || handler.is_a?(String)
|
|
29
|
+
end
|
|
30
|
+
end
|
|
31
|
+
end
|
|
32
|
+
end
|
|
@@ -1,6 +1,18 @@
|
|
|
1
1
|
# frozen_string_literal: true
|
|
2
2
|
|
|
3
3
|
require "active_support/core_ext/string/inflections"
|
|
4
|
+
require "source_monitor/configuration/http_settings"
|
|
5
|
+
require "source_monitor/configuration/fetching_settings"
|
|
6
|
+
require "source_monitor/configuration/health_settings"
|
|
7
|
+
require "source_monitor/configuration/scraping_settings"
|
|
8
|
+
require "source_monitor/configuration/realtime_settings"
|
|
9
|
+
require "source_monitor/configuration/retention_settings"
|
|
10
|
+
require "source_monitor/configuration/authentication_settings"
|
|
11
|
+
require "source_monitor/configuration/scraper_registry"
|
|
12
|
+
require "source_monitor/configuration/events"
|
|
13
|
+
require "source_monitor/configuration/validation_definition"
|
|
14
|
+
require "source_monitor/configuration/model_definition"
|
|
15
|
+
require "source_monitor/configuration/models"
|
|
4
16
|
|
|
5
17
|
module SourceMonitor
|
|
6
18
|
class Configuration
|
|
@@ -71,584 +83,5 @@ module SourceMonitor
|
|
|
71
83
|
raise ArgumentError, "unknown queue role #{role.inspect}"
|
|
72
84
|
end
|
|
73
85
|
end
|
|
74
|
-
|
|
75
|
-
class AuthenticationSettings
|
|
76
|
-
Handler = Struct.new(:type, :callable) do
|
|
77
|
-
def call(controller)
|
|
78
|
-
return unless callable
|
|
79
|
-
|
|
80
|
-
case type
|
|
81
|
-
when :symbol
|
|
82
|
-
controller.public_send(callable)
|
|
83
|
-
when :callable
|
|
84
|
-
arity = callable.arity
|
|
85
|
-
if arity.zero?
|
|
86
|
-
controller.instance_exec(&callable)
|
|
87
|
-
else
|
|
88
|
-
callable.call(controller)
|
|
89
|
-
end
|
|
90
|
-
end
|
|
91
|
-
end
|
|
92
|
-
end
|
|
93
|
-
|
|
94
|
-
attr_reader :authenticate_handler, :authorize_handler
|
|
95
|
-
attr_accessor :current_user_method, :user_signed_in_method
|
|
96
|
-
|
|
97
|
-
def initialize
|
|
98
|
-
reset!
|
|
99
|
-
end
|
|
100
|
-
|
|
101
|
-
def authenticate_with(handler = nil, &block)
|
|
102
|
-
@authenticate_handler = build_handler(handler, &block)
|
|
103
|
-
end
|
|
104
|
-
|
|
105
|
-
def authorize_with(handler = nil, &block)
|
|
106
|
-
@authorize_handler = build_handler(handler, &block)
|
|
107
|
-
end
|
|
108
|
-
|
|
109
|
-
def reset!
|
|
110
|
-
@authenticate_handler = nil
|
|
111
|
-
@authorize_handler = nil
|
|
112
|
-
@current_user_method = nil
|
|
113
|
-
@user_signed_in_method = nil
|
|
114
|
-
end
|
|
115
|
-
|
|
116
|
-
private
|
|
117
|
-
|
|
118
|
-
def build_handler(handler = nil, &block)
|
|
119
|
-
handler ||= block
|
|
120
|
-
return nil unless handler
|
|
121
|
-
|
|
122
|
-
if handler.is_a?(Symbol) || handler.is_a?(String)
|
|
123
|
-
Handler.new(:symbol, handler.to_sym)
|
|
124
|
-
elsif handler.respond_to?(:call)
|
|
125
|
-
Handler.new(:callable, handler)
|
|
126
|
-
else
|
|
127
|
-
raise ArgumentError, "Invalid authentication handler #{handler.inspect}"
|
|
128
|
-
end
|
|
129
|
-
end
|
|
130
|
-
end
|
|
131
|
-
|
|
132
|
-
class ScrapingSettings
|
|
133
|
-
attr_accessor :max_in_flight_per_source, :max_bulk_batch_size
|
|
134
|
-
|
|
135
|
-
DEFAULT_MAX_IN_FLIGHT = 25
|
|
136
|
-
DEFAULT_MAX_BULK_BATCH_SIZE = 100
|
|
137
|
-
|
|
138
|
-
def initialize
|
|
139
|
-
reset!
|
|
140
|
-
end
|
|
141
|
-
|
|
142
|
-
def reset!
|
|
143
|
-
@max_in_flight_per_source = DEFAULT_MAX_IN_FLIGHT
|
|
144
|
-
@max_bulk_batch_size = DEFAULT_MAX_BULK_BATCH_SIZE
|
|
145
|
-
end
|
|
146
|
-
|
|
147
|
-
def max_in_flight_per_source=(value)
|
|
148
|
-
@max_in_flight_per_source = normalize_numeric(value)
|
|
149
|
-
end
|
|
150
|
-
|
|
151
|
-
def max_bulk_batch_size=(value)
|
|
152
|
-
@max_bulk_batch_size = normalize_numeric(value)
|
|
153
|
-
end
|
|
154
|
-
|
|
155
|
-
private
|
|
156
|
-
|
|
157
|
-
def normalize_numeric(value)
|
|
158
|
-
return nil if value.nil?
|
|
159
|
-
return nil if value == ""
|
|
160
|
-
|
|
161
|
-
integer = value.respond_to?(:to_i) ? value.to_i : value
|
|
162
|
-
integer.positive? ? integer : nil
|
|
163
|
-
end
|
|
164
|
-
end
|
|
165
|
-
|
|
166
|
-
class RealtimeSettings
|
|
167
|
-
VALID_ADAPTERS = %i[solid_cable redis async].freeze
|
|
168
|
-
|
|
169
|
-
attr_reader :adapter, :solid_cable
|
|
170
|
-
attr_accessor :redis_url
|
|
171
|
-
|
|
172
|
-
def initialize
|
|
173
|
-
reset!
|
|
174
|
-
end
|
|
175
|
-
|
|
176
|
-
def adapter=(value)
|
|
177
|
-
value = value&.to_sym
|
|
178
|
-
unless VALID_ADAPTERS.include?(value)
|
|
179
|
-
raise ArgumentError, "Unsupported realtime adapter #{value.inspect}"
|
|
180
|
-
end
|
|
181
|
-
|
|
182
|
-
@adapter = value
|
|
183
|
-
end
|
|
184
|
-
|
|
185
|
-
def reset!
|
|
186
|
-
@solid_cable = SolidCableOptions.new
|
|
187
|
-
@redis_url = nil
|
|
188
|
-
self.adapter = :solid_cable
|
|
189
|
-
end
|
|
190
|
-
|
|
191
|
-
def solid_cable=(options)
|
|
192
|
-
solid_cable.assign(options)
|
|
193
|
-
end
|
|
194
|
-
|
|
195
|
-
def action_cable_config
|
|
196
|
-
case adapter
|
|
197
|
-
when :solid_cable
|
|
198
|
-
solid_cable.to_h.merge(adapter: "solid_cable")
|
|
199
|
-
when :redis
|
|
200
|
-
config = { adapter: "redis" }
|
|
201
|
-
config[:url] = redis_url if redis_url.present?
|
|
202
|
-
config
|
|
203
|
-
when :async
|
|
204
|
-
{ adapter: "async" }
|
|
205
|
-
else
|
|
206
|
-
{}
|
|
207
|
-
end
|
|
208
|
-
end
|
|
209
|
-
|
|
210
|
-
class SolidCableOptions
|
|
211
|
-
attr_accessor :polling_interval,
|
|
212
|
-
:message_retention,
|
|
213
|
-
:autotrim,
|
|
214
|
-
:silence_polling,
|
|
215
|
-
:use_skip_locked,
|
|
216
|
-
:trim_batch_size,
|
|
217
|
-
:connects_to
|
|
218
|
-
|
|
219
|
-
def initialize
|
|
220
|
-
reset!
|
|
221
|
-
end
|
|
222
|
-
|
|
223
|
-
def assign(options)
|
|
224
|
-
return unless options.respond_to?(:each)
|
|
225
|
-
|
|
226
|
-
options.each do |key, value|
|
|
227
|
-
setter = "#{key}="
|
|
228
|
-
public_send(setter, value) if respond_to?(setter)
|
|
229
|
-
end
|
|
230
|
-
end
|
|
231
|
-
|
|
232
|
-
def reset!
|
|
233
|
-
@polling_interval = "0.1.seconds"
|
|
234
|
-
@message_retention = "1.day"
|
|
235
|
-
@autotrim = true
|
|
236
|
-
@silence_polling = true
|
|
237
|
-
@use_skip_locked = true
|
|
238
|
-
@trim_batch_size = nil
|
|
239
|
-
@connects_to = nil
|
|
240
|
-
end
|
|
241
|
-
|
|
242
|
-
def to_h
|
|
243
|
-
{
|
|
244
|
-
polling_interval: polling_interval,
|
|
245
|
-
message_retention: message_retention,
|
|
246
|
-
autotrim: autotrim,
|
|
247
|
-
silence_polling: silence_polling,
|
|
248
|
-
use_skip_locked: use_skip_locked,
|
|
249
|
-
trim_batch_size: trim_batch_size,
|
|
250
|
-
connects_to: connects_to
|
|
251
|
-
}.compact
|
|
252
|
-
end
|
|
253
|
-
end
|
|
254
|
-
end
|
|
255
|
-
|
|
256
|
-
class HTTPSettings
|
|
257
|
-
attr_accessor :timeout,
|
|
258
|
-
:open_timeout,
|
|
259
|
-
:max_redirects,
|
|
260
|
-
:user_agent,
|
|
261
|
-
:proxy,
|
|
262
|
-
:headers,
|
|
263
|
-
:retry_max,
|
|
264
|
-
:retry_interval,
|
|
265
|
-
:retry_interval_randomness,
|
|
266
|
-
:retry_backoff_factor,
|
|
267
|
-
:retry_statuses
|
|
268
|
-
|
|
269
|
-
def initialize
|
|
270
|
-
reset!
|
|
271
|
-
end
|
|
272
|
-
|
|
273
|
-
def reset!
|
|
274
|
-
@timeout = 15
|
|
275
|
-
@open_timeout = 5
|
|
276
|
-
@max_redirects = 5
|
|
277
|
-
@user_agent = default_user_agent
|
|
278
|
-
@proxy = nil
|
|
279
|
-
@headers = {}
|
|
280
|
-
@retry_max = 4
|
|
281
|
-
@retry_interval = 0.5
|
|
282
|
-
@retry_interval_randomness = 0.5
|
|
283
|
-
@retry_backoff_factor = 2
|
|
284
|
-
@retry_statuses = nil
|
|
285
|
-
end
|
|
286
|
-
|
|
287
|
-
private
|
|
288
|
-
|
|
289
|
-
def default_user_agent
|
|
290
|
-
"SourceMonitor/#{SourceMonitor::VERSION}"
|
|
291
|
-
end
|
|
292
|
-
end
|
|
293
|
-
|
|
294
|
-
class FetchingSettings
|
|
295
|
-
attr_accessor :min_interval_minutes,
|
|
296
|
-
:max_interval_minutes,
|
|
297
|
-
:increase_factor,
|
|
298
|
-
:decrease_factor,
|
|
299
|
-
:failure_increase_factor,
|
|
300
|
-
:jitter_percent
|
|
301
|
-
|
|
302
|
-
def initialize
|
|
303
|
-
reset!
|
|
304
|
-
end
|
|
305
|
-
|
|
306
|
-
def reset!
|
|
307
|
-
@min_interval_minutes = 5
|
|
308
|
-
@max_interval_minutes = 24 * 60
|
|
309
|
-
@increase_factor = 1.25
|
|
310
|
-
@decrease_factor = 0.75
|
|
311
|
-
@failure_increase_factor = 1.5
|
|
312
|
-
@jitter_percent = 0.1
|
|
313
|
-
end
|
|
314
|
-
end
|
|
315
|
-
|
|
316
|
-
class HealthSettings
|
|
317
|
-
attr_accessor :window_size,
|
|
318
|
-
:healthy_threshold,
|
|
319
|
-
:warning_threshold,
|
|
320
|
-
:auto_pause_threshold,
|
|
321
|
-
:auto_resume_threshold,
|
|
322
|
-
:auto_pause_cooldown_minutes
|
|
323
|
-
|
|
324
|
-
def initialize
|
|
325
|
-
reset!
|
|
326
|
-
end
|
|
327
|
-
|
|
328
|
-
def reset!
|
|
329
|
-
@window_size = 20
|
|
330
|
-
@healthy_threshold = 0.8
|
|
331
|
-
@warning_threshold = 0.5
|
|
332
|
-
@auto_pause_threshold = 0.2
|
|
333
|
-
@auto_resume_threshold = 0.6
|
|
334
|
-
@auto_pause_cooldown_minutes = 60
|
|
335
|
-
end
|
|
336
|
-
end
|
|
337
|
-
|
|
338
|
-
class ScraperRegistry
|
|
339
|
-
include Enumerable
|
|
340
|
-
|
|
341
|
-
def initialize
|
|
342
|
-
@adapters = {}
|
|
343
|
-
end
|
|
344
|
-
|
|
345
|
-
def register(name, adapter)
|
|
346
|
-
key = normalize_name(name)
|
|
347
|
-
@adapters[key] = normalize_adapter(adapter)
|
|
348
|
-
end
|
|
349
|
-
|
|
350
|
-
def unregister(name)
|
|
351
|
-
@adapters.delete(normalize_name(name))
|
|
352
|
-
end
|
|
353
|
-
|
|
354
|
-
def adapter_for(name)
|
|
355
|
-
adapter = @adapters[normalize_name(name)]
|
|
356
|
-
adapter if adapter
|
|
357
|
-
end
|
|
358
|
-
|
|
359
|
-
def each(&block)
|
|
360
|
-
@adapters.each(&block)
|
|
361
|
-
end
|
|
362
|
-
|
|
363
|
-
private
|
|
364
|
-
|
|
365
|
-
def normalize_name(name)
|
|
366
|
-
value = name.to_s
|
|
367
|
-
raise ArgumentError, "Invalid scraper adapter name #{name.inspect}" unless value.match?(/\A[a-z0-9_]+\z/i)
|
|
368
|
-
|
|
369
|
-
value.downcase
|
|
370
|
-
end
|
|
371
|
-
|
|
372
|
-
def normalize_adapter(adapter)
|
|
373
|
-
constant = resolve_adapter(adapter)
|
|
374
|
-
|
|
375
|
-
if defined?(SourceMonitor::Scrapers::Base) && !(constant <= SourceMonitor::Scrapers::Base)
|
|
376
|
-
raise ArgumentError, "Scraper adapters must inherit from SourceMonitor::Scrapers::Base"
|
|
377
|
-
end
|
|
378
|
-
|
|
379
|
-
constant
|
|
380
|
-
end
|
|
381
|
-
|
|
382
|
-
def resolve_adapter(adapter)
|
|
383
|
-
return adapter if adapter.is_a?(Class)
|
|
384
|
-
|
|
385
|
-
if adapter.respond_to?(:to_s)
|
|
386
|
-
constant_name = adapter.to_s
|
|
387
|
-
begin
|
|
388
|
-
return constant_name.constantize
|
|
389
|
-
rescue NameError
|
|
390
|
-
raise ArgumentError, "Unknown scraper adapter constant #{constant_name.inspect}"
|
|
391
|
-
end
|
|
392
|
-
end
|
|
393
|
-
|
|
394
|
-
raise ArgumentError, "Invalid scraper adapter #{adapter.inspect}"
|
|
395
|
-
end
|
|
396
|
-
end
|
|
397
|
-
|
|
398
|
-
class RetentionSettings
|
|
399
|
-
attr_accessor :items_retention_days, :max_items
|
|
400
|
-
|
|
401
|
-
def initialize
|
|
402
|
-
@items_retention_days = nil
|
|
403
|
-
@max_items = nil
|
|
404
|
-
@strategy = :destroy
|
|
405
|
-
end
|
|
406
|
-
|
|
407
|
-
def strategy
|
|
408
|
-
@strategy
|
|
409
|
-
end
|
|
410
|
-
|
|
411
|
-
def strategy=(value)
|
|
412
|
-
normalized = normalize_strategy(value)
|
|
413
|
-
@strategy = normalized unless normalized.nil?
|
|
414
|
-
end
|
|
415
|
-
|
|
416
|
-
private
|
|
417
|
-
|
|
418
|
-
def normalize_strategy(value)
|
|
419
|
-
return :destroy if value.nil?
|
|
420
|
-
|
|
421
|
-
if value.respond_to?(:to_sym)
|
|
422
|
-
candidate = value.to_sym
|
|
423
|
-
valid =
|
|
424
|
-
if defined?(SourceMonitor::Items::RetentionPruner::VALID_STRATEGIES)
|
|
425
|
-
SourceMonitor::Items::RetentionPruner::VALID_STRATEGIES
|
|
426
|
-
else
|
|
427
|
-
%i[destroy soft_delete]
|
|
428
|
-
end
|
|
429
|
-
|
|
430
|
-
raise ArgumentError, "Invalid retention strategy #{value.inspect}" unless valid.include?(candidate)
|
|
431
|
-
candidate
|
|
432
|
-
else
|
|
433
|
-
raise ArgumentError, "Invalid retention strategy #{value.inspect}"
|
|
434
|
-
end
|
|
435
|
-
end
|
|
436
|
-
end
|
|
437
|
-
|
|
438
|
-
class Events
|
|
439
|
-
CALLBACK_KEYS = %i[after_item_created after_item_scraped after_fetch_completed].freeze
|
|
440
|
-
|
|
441
|
-
def initialize
|
|
442
|
-
@callbacks = Hash.new { |hash, key| hash[key] = [] }
|
|
443
|
-
@item_processors = []
|
|
444
|
-
end
|
|
445
|
-
|
|
446
|
-
CALLBACK_KEYS.each do |key|
|
|
447
|
-
define_method(key) do |handler = nil, &block|
|
|
448
|
-
register_callback(key, handler, &block)
|
|
449
|
-
end
|
|
450
|
-
end
|
|
451
|
-
|
|
452
|
-
def register_item_processor(processor = nil, &block)
|
|
453
|
-
callable = processor || block
|
|
454
|
-
validate_callable!(callable, :item_processor)
|
|
455
|
-
@item_processors << callable
|
|
456
|
-
callable
|
|
457
|
-
end
|
|
458
|
-
|
|
459
|
-
def callbacks_for(name)
|
|
460
|
-
@callbacks[name.to_sym]&.dup || []
|
|
461
|
-
end
|
|
462
|
-
|
|
463
|
-
def item_processors
|
|
464
|
-
@item_processors.dup
|
|
465
|
-
end
|
|
466
|
-
|
|
467
|
-
def reset!
|
|
468
|
-
@callbacks.clear
|
|
469
|
-
@item_processors.clear
|
|
470
|
-
end
|
|
471
|
-
|
|
472
|
-
private
|
|
473
|
-
|
|
474
|
-
def register_callback(key, handler = nil, &block)
|
|
475
|
-
callable = handler || block
|
|
476
|
-
validate_callable!(callable, key)
|
|
477
|
-
key = key.to_sym
|
|
478
|
-
unless CALLBACK_KEYS.include?(key)
|
|
479
|
-
raise ArgumentError, "Unknown event #{key.inspect}"
|
|
480
|
-
end
|
|
481
|
-
|
|
482
|
-
@callbacks[key] << callable
|
|
483
|
-
callable
|
|
484
|
-
end
|
|
485
|
-
|
|
486
|
-
def validate_callable!(callable, name)
|
|
487
|
-
unless callable.respond_to?(:call)
|
|
488
|
-
raise ArgumentError, "#{name} handler must respond to #call"
|
|
489
|
-
end
|
|
490
|
-
end
|
|
491
|
-
end
|
|
492
|
-
|
|
493
|
-
class Models
|
|
494
|
-
MODEL_KEYS = {
|
|
495
|
-
source: :source,
|
|
496
|
-
item: :item,
|
|
497
|
-
fetch_log: :fetch_log,
|
|
498
|
-
scrape_log: :scrape_log,
|
|
499
|
-
health_check_log: :health_check_log,
|
|
500
|
-
item_content: :item_content,
|
|
501
|
-
log_entry: :log_entry
|
|
502
|
-
}.freeze
|
|
503
|
-
|
|
504
|
-
attr_accessor :table_name_prefix
|
|
505
|
-
|
|
506
|
-
def initialize
|
|
507
|
-
@table_name_prefix = "sourcemon_"
|
|
508
|
-
@definitions = MODEL_KEYS.transform_values { ModelDefinition.new }
|
|
509
|
-
end
|
|
510
|
-
|
|
511
|
-
MODEL_KEYS.each do |method_name, key|
|
|
512
|
-
define_method(method_name) { @definitions[key] }
|
|
513
|
-
end
|
|
514
|
-
|
|
515
|
-
def for(name)
|
|
516
|
-
key = name.to_sym
|
|
517
|
-
definition = @definitions[key]
|
|
518
|
-
raise ArgumentError, "Unknown model #{name.inspect}" unless definition
|
|
519
|
-
|
|
520
|
-
definition
|
|
521
|
-
end
|
|
522
|
-
end
|
|
523
|
-
|
|
524
|
-
class ModelDefinition
|
|
525
|
-
attr_reader :validations
|
|
526
|
-
|
|
527
|
-
def initialize
|
|
528
|
-
@concern_definitions = []
|
|
529
|
-
@validations = []
|
|
530
|
-
end
|
|
531
|
-
|
|
532
|
-
def include_concern(concern = nil, &block)
|
|
533
|
-
definition = ConcernDefinition.new(concern, block)
|
|
534
|
-
unless @concern_definitions.any? { |existing| existing.signature == definition.signature }
|
|
535
|
-
@concern_definitions << definition
|
|
536
|
-
end
|
|
537
|
-
|
|
538
|
-
definition.return_value
|
|
539
|
-
end
|
|
540
|
-
|
|
541
|
-
def each_concern
|
|
542
|
-
return enum_for(:each_concern) unless block_given?
|
|
543
|
-
|
|
544
|
-
@concern_definitions.each do |definition|
|
|
545
|
-
yield definition.signature, definition.resolve
|
|
546
|
-
end
|
|
547
|
-
end
|
|
548
|
-
|
|
549
|
-
def validate(handler = nil, **options, &block)
|
|
550
|
-
callable =
|
|
551
|
-
if block
|
|
552
|
-
block
|
|
553
|
-
elsif handler.respond_to?(:call) && !handler.is_a?(Symbol) && !handler.is_a?(String)
|
|
554
|
-
handler
|
|
555
|
-
elsif handler.is_a?(Symbol) || handler.is_a?(String)
|
|
556
|
-
handler.to_sym
|
|
557
|
-
else
|
|
558
|
-
raise ArgumentError, "Invalid validation handler #{handler.inspect}"
|
|
559
|
-
end
|
|
560
|
-
|
|
561
|
-
validation = ValidationDefinition.new(callable, options)
|
|
562
|
-
@validations << validation
|
|
563
|
-
validation
|
|
564
|
-
end
|
|
565
|
-
|
|
566
|
-
private
|
|
567
|
-
|
|
568
|
-
class ConcernDefinition
|
|
569
|
-
attr_reader :signature
|
|
570
|
-
|
|
571
|
-
def initialize(concern, block)
|
|
572
|
-
@resolver = build_resolver(concern, block)
|
|
573
|
-
@signature = build_signature(concern, block)
|
|
574
|
-
@return_value = determine_return_value(concern, block)
|
|
575
|
-
end
|
|
576
|
-
|
|
577
|
-
def resolve
|
|
578
|
-
@resolved ||= @resolver.call
|
|
579
|
-
end
|
|
580
|
-
|
|
581
|
-
def return_value
|
|
582
|
-
@return_value
|
|
583
|
-
end
|
|
584
|
-
|
|
585
|
-
private
|
|
586
|
-
|
|
587
|
-
def build_resolver(concern, block)
|
|
588
|
-
if block
|
|
589
|
-
mod = Module.new(&block)
|
|
590
|
-
-> { mod }
|
|
591
|
-
elsif concern.is_a?(Module)
|
|
592
|
-
-> { concern }
|
|
593
|
-
elsif concern.respond_to?(:to_s)
|
|
594
|
-
constant_name = concern.to_s
|
|
595
|
-
lambda do
|
|
596
|
-
constant_name.constantize
|
|
597
|
-
rescue NameError => error
|
|
598
|
-
raise ArgumentError, error.message
|
|
599
|
-
end
|
|
600
|
-
else
|
|
601
|
-
raise ArgumentError, "Invalid concern #{concern.inspect}"
|
|
602
|
-
end
|
|
603
|
-
end
|
|
604
|
-
|
|
605
|
-
def build_signature(concern, block)
|
|
606
|
-
if block
|
|
607
|
-
[ :anonymous_module, block.object_id ]
|
|
608
|
-
elsif concern.is_a?(Module)
|
|
609
|
-
[ :module, concern.object_id ]
|
|
610
|
-
else
|
|
611
|
-
[ :constant, concern.to_s ]
|
|
612
|
-
end
|
|
613
|
-
end
|
|
614
|
-
|
|
615
|
-
def determine_return_value(concern, block)
|
|
616
|
-
if block
|
|
617
|
-
resolve
|
|
618
|
-
elsif concern.is_a?(Module)
|
|
619
|
-
concern
|
|
620
|
-
else
|
|
621
|
-
concern
|
|
622
|
-
end
|
|
623
|
-
end
|
|
624
|
-
end
|
|
625
|
-
end
|
|
626
|
-
|
|
627
|
-
class ValidationDefinition
|
|
628
|
-
attr_reader :handler, :options
|
|
629
|
-
|
|
630
|
-
def initialize(handler, options)
|
|
631
|
-
@handler = handler
|
|
632
|
-
@options = options
|
|
633
|
-
end
|
|
634
|
-
|
|
635
|
-
def signature
|
|
636
|
-
handler_key =
|
|
637
|
-
case handler
|
|
638
|
-
when Symbol
|
|
639
|
-
[ :symbol, handler ]
|
|
640
|
-
when String
|
|
641
|
-
[ :symbol, handler.to_sym ]
|
|
642
|
-
else
|
|
643
|
-
[ :callable, handler.object_id ]
|
|
644
|
-
end
|
|
645
|
-
|
|
646
|
-
[ handler_key, options ]
|
|
647
|
-
end
|
|
648
|
-
|
|
649
|
-
def symbol?
|
|
650
|
-
handler.is_a?(Symbol) || handler.is_a?(String)
|
|
651
|
-
end
|
|
652
|
-
end
|
|
653
86
|
end
|
|
654
87
|
end
|