udata-hydra 2.4.1.dev9596__tar.gz → 2.4.2.dev9635__tar.gz
This diff compares the contents of two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/PKG-INFO +1 -1
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/pyproject.toml +1 -1
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/__init__.py +7 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/config_default.toml +1 -1
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/crawl/check_resources.py +2 -1
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/routes/checks.py +2 -1
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/utils/file.py +1 -1
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/utils/http.py +1 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/README.md +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/analysis/__init__.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/analysis/csv.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/analysis/geojson.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/analysis/helpers.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/analysis/resource.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/app.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/cli.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/context.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/crawl/__init__.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/crawl/calculate_next_check.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/crawl/helpers.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/crawl/preprocess_check_data.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/crawl/select_batch.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/db/__init__.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/db/check.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/db/resource.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/db/resource_exception.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/logger.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/__init__.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/csv/20221205_initial_up_rev1.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/csv/20230130_drop_migrations.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/csv/20230206_datetime_aware.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/csv/20240827_add_indexes_column_to_tables_index_table.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/csv/20250610_migrate_resources_exception.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/csv/20250626_delete_datetime_iso_references.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/csv/20250902_delete_analyses_too_long_column_names.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20221205_initial_up_rev1.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20221206_rev1_up_rev2.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20221206_rev2_up_rev3.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20221208_rev3_up_rev4.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20221208_rev4_up_rev5.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20230119_rev5_up_rev6.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20230121_rev6_up_rev7.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20230121_rev7_up_rev8.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20230130_drop_migrations.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20230206_datetime_aware.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20230515_rev8_up_rev9.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20230606_rev9_up_rev10.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20231102_drop_csv_analysis.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20240827_add_resources_exceptions_table.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20240926_add_indexes.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20241004_add_comment_column_to_resources_exceptions.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20241021_add_parquet_columns.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20241023_alter_foreign_key.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20241025_add_next_check_column.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20250108_add_indexes.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20250130_add_pmtiles_fields.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20250519_add_format_column_catalog.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20250610_migrate_resources_exception.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20250611_add_status_since_catalog.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/migrations/main/20250615_add_geojson_fields.sql +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/routes/__init__.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/routes/resources.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/routes/resources_exceptions.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/routes/status.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/schemas/__init__.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/schemas/check.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/schemas/resource.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/schemas/resource_exception.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/utils/__init__.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/utils/auth.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/utils/csv.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/utils/db.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/utils/errors.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/utils/geojson.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/utils/minio.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/utils/parquet.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/utils/queue.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/utils/timer.py +0 -0
- {udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/worker.py +0 -0
|
@@ -49,5 +49,12 @@ class Configurator:
|
|
|
49
49
|
def __dict__(self):
|
|
50
50
|
return self.configuration
|
|
51
51
|
|
|
52
|
+
@property
|
|
53
|
+
def USER_AGENT_FULL(self) -> str:
|
|
54
|
+
"""Build the complete user agent string with version"""
|
|
55
|
+
if self.USER_AGENT and self.APP_VERSION:
|
|
56
|
+
return f"{self.USER_AGENT}/{self.APP_VERSION}"
|
|
57
|
+
return "udata-hydra"
|
|
58
|
+
|
|
52
59
|
|
|
53
60
|
config = Configurator()
|
|
@@ -13,7 +13,7 @@ SENTRY_SAMPLE_RATE = 1.0
|
|
|
13
13
|
TESTING = false
|
|
14
14
|
# max postgres pool size
|
|
15
15
|
MAX_POOL_SIZE = 50
|
|
16
|
-
USER_AGENT = "udata-hydra
|
|
16
|
+
USER_AGENT = "udata-hydra" # without version - version is dynamically added
|
|
17
17
|
NAMEDATALEN = 64 # should be set to the same value as in Postgres, but we can't query it
|
|
18
18
|
|
|
19
19
|
API_KEY = "hydra_api_key_to_change"
|
{udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/crawl/check_resources.py
RENAMED
|
@@ -36,7 +36,8 @@ async def check_batch_resources(to_parse: list[Record]) -> None:
|
|
|
36
36
|
context.monitor().set_status("Checking resources...")
|
|
37
37
|
tasks: list = []
|
|
38
38
|
async with aiohttp.ClientSession(
|
|
39
|
-
timeout=None,
|
|
39
|
+
timeout=None,
|
|
40
|
+
headers={"user-agent": config.USER_AGENT_FULL},
|
|
40
41
|
) as session:
|
|
41
42
|
for row in to_parse:
|
|
42
43
|
tasks.append(
|
|
@@ -77,7 +77,8 @@ async def create_check(request: web.Request) -> web.Response:
|
|
|
77
77
|
context.monitor().set_status(f'Crawling url "{url}"...')
|
|
78
78
|
|
|
79
79
|
async with aiohttp.ClientSession(
|
|
80
|
-
timeout=None,
|
|
80
|
+
timeout=None,
|
|
81
|
+
headers={"user-agent": config.USER_AGENT_FULL},
|
|
81
82
|
) as session:
|
|
82
83
|
status: str = await check_resource(
|
|
83
84
|
url=url,
|
|
@@ -60,7 +60,7 @@ async def download_resource(
|
|
|
60
60
|
too_large, download_error = False, None
|
|
61
61
|
try:
|
|
62
62
|
async with aiohttp.ClientSession(
|
|
63
|
-
headers={"user-agent": config.USER_AGENT},
|
|
63
|
+
headers={"user-agent": config.USER_AGENT_FULL},
|
|
64
64
|
raise_for_status=True,
|
|
65
65
|
) as session:
|
|
66
66
|
async with session.get(url, allow_redirects=True) as response:
|
|
@@ -79,6 +79,7 @@ async def send(dataset_id: str, resource_id: str, document: UdataPayload) -> Non
|
|
|
79
79
|
|
|
80
80
|
uri = f"{config.UDATA_URI}/datasets/{dataset_id}/resources/{resource_id}/extras/"
|
|
81
81
|
headers = {
|
|
82
|
+
"user-agent": config.USER_AGENT_FULL,
|
|
82
83
|
"content-type": "application/json",
|
|
83
84
|
"X-API-KEY": config.UDATA_URI_API_KEY,
|
|
84
85
|
}
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/crawl/calculate_next_check.py
RENAMED
|
File without changes
|
|
File without changes
|
{udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/crawl/preprocess_check_data.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/db/resource_exception.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/routes/resources_exceptions.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{udata_hydra-2.4.1.dev9596 → udata_hydra-2.4.2.dev9635}/udata_hydra/schemas/resource_exception.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|