udata-hydra 2.2.2.dev7678__tar.gz → 2.2.2.dev7693__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (78)
  1. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/PKG-INFO +1 -1
  2. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/pyproject.toml +1 -1
  3. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/analysis/csv.py +23 -5
  4. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/analysis/geojson.py +5 -1
  5. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/README.md +0 -0
  6. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/__init__.py +0 -0
  7. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/analysis/__init__.py +0 -0
  8. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/analysis/helpers.py +0 -0
  9. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/analysis/resource.py +0 -0
  10. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/app.py +0 -0
  11. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/cli.py +0 -0
  12. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/config_default.toml +0 -0
  13. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/context.py +0 -0
  14. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/crawl/__init__.py +0 -0
  15. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/crawl/calculate_next_check.py +0 -0
  16. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/crawl/check_resources.py +0 -0
  17. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/crawl/helpers.py +0 -0
  18. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/crawl/preprocess_check_data.py +0 -0
  19. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/crawl/select_batch.py +0 -0
  20. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/db/__init__.py +0 -0
  21. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/db/check.py +0 -0
  22. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/db/resource.py +0 -0
  23. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/db/resource_exception.py +0 -0
  24. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/logger.py +0 -0
  25. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/__init__.py +0 -0
  26. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/csv/20221205_initial_up_rev1.sql +0 -0
  27. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/csv/20230130_drop_migrations.sql +0 -0
  28. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/csv/20230206_datetime_aware.sql +0 -0
  29. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/csv/20240827_add_indexes_column_to_tables_index_table.sql +0 -0
  30. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/csv/20250610_migrate_resources_exception.sql +0 -0
  31. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/csv/20250626_delete_datetime_iso_references.sql +0 -0
  32. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20221205_initial_up_rev1.sql +0 -0
  33. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20221206_rev1_up_rev2.sql +0 -0
  34. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20221206_rev2_up_rev3.sql +0 -0
  35. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20221208_rev3_up_rev4.sql +0 -0
  36. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20221208_rev4_up_rev5.sql +0 -0
  37. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20230119_rev5_up_rev6.sql +0 -0
  38. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20230121_rev6_up_rev7.sql +0 -0
  39. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20230121_rev7_up_rev8.sql +0 -0
  40. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20230130_drop_migrations.sql +0 -0
  41. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20230206_datetime_aware.sql +0 -0
  42. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20230515_rev8_up_rev9.sql +0 -0
  43. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20230606_rev9_up_rev10.sql +0 -0
  44. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20231102_drop_csv_analysis.sql +0 -0
  45. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20240827_add_resources_exceptions_table.sql +0 -0
  46. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20240926_add_indexes.sql +0 -0
  47. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20241004_add_comment_column_to_resources_exceptions.sql +0 -0
  48. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20241021_add_parquet_columns.sql +0 -0
  49. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20241023_alter_foreign_key.sql +0 -0
  50. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20241025_add_next_check_column.sql +0 -0
  51. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20250108_add_indexes.sql +0 -0
  52. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20250130_add_pmtiles_fields.sql +0 -0
  53. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20250519_add_format_column_catalog.sql +0 -0
  54. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20250610_migrate_resources_exception.sql +0 -0
  55. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20250611_add_status_since_catalog.sql +0 -0
  56. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/migrations/main/20250615_add_geojson_fields.sql +0 -0
  57. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/routes/__init__.py +0 -0
  58. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/routes/checks.py +0 -0
  59. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/routes/resources.py +0 -0
  60. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/routes/resources_exceptions.py +0 -0
  61. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/routes/status.py +0 -0
  62. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/schemas/__init__.py +0 -0
  63. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/schemas/check.py +0 -0
  64. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/schemas/resource.py +0 -0
  65. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/schemas/resource_exception.py +0 -0
  66. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/utils/__init__.py +0 -0
  67. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/utils/auth.py +0 -0
  68. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/utils/csv.py +0 -0
  69. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/utils/db.py +0 -0
  70. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/utils/errors.py +0 -0
  71. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/utils/file.py +0 -0
  72. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/utils/geojson.py +0 -0
  73. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/utils/http.py +0 -0
  74. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/utils/minio.py +0 -0
  75. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/utils/parquet.py +0 -0
  76. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/utils/queue.py +0 -0
  77. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/utils/timer.py +0 -0
  78. {udata_hydra-2.2.2.dev7678 → udata_hydra-2.2.2.dev7693}/udata_hydra/worker.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: udata-hydra
3
- Version: 2.2.2.dev7678
3
+ Version: 2.2.2.dev7693
4
4
  Summary: Async crawler and parsing service for data.gouv.fr
5
5
  License: MIT
6
6
  Author: Opendata Team
@@ -1,6 +1,6 @@
1
1
  [project]
2
2
  name = "udata-hydra"
3
- version = "2.2.2.dev7678"
3
+ version = "2.2.2.dev7693"
4
4
  description = "Async crawler and parsing service for data.gouv.fr"
5
5
  authors = [{ name = "Opendata Team", email = "opendatateam@data.gouv.fr" }]
6
6
  dependencies = [
@@ -139,7 +139,11 @@ async def analyse_csv(
139
139
  )
140
140
  except Exception as e:
141
141
  raise ParseException(
142
- step="csv_detective", resource_id=resource_id, url=url, check_id=check["id"]
142
+ message=str(e),
143
+ step="csv_detective",
144
+ resource_id=resource_id,
145
+ url=url,
146
+ check_id=check["id"],
143
147
  ) from e
144
148
  timer.mark("csv-inspection")
145
149
 
@@ -163,7 +167,11 @@ async def analyse_csv(
163
167
  except Exception as e:
164
168
  remove_remainders(resource_id, ["parquet"])
165
169
  raise ParseException(
166
- step="parquet_export", resource_id=resource_id, url=url, check_id=check["id"]
170
+ message=str(e),
171
+ step="parquet_export",
172
+ resource_id=resource_id,
173
+ url=url,
174
+ check_id=check["id"],
167
175
  ) from e
168
176
 
169
177
  try:
@@ -176,7 +184,11 @@ async def analyse_csv(
176
184
  except Exception as e:
177
185
  remove_remainders(resource_id, ["geojson", "pmtiles", "pmtiles-journal"])
178
186
  raise ParseException(
179
- step="geojson_export", resource_id=resource_id, url=url, check_id=check["id"]
187
+ message=str(e),
188
+ step="geojson_export",
189
+ resource_id=resource_id,
190
+ url=url,
191
+ check_id=check["id"],
180
192
  ) from e
181
193
 
182
194
  check = await Check.update(
@@ -381,7 +393,10 @@ async def csv_to_db(
381
393
  await db.execute(q)
382
394
  except Exception as e:
383
395
  raise ParseException(
384
- step="create_table_query", resource_id=resource_id, table_name=table_name
396
+ message=str(e),
397
+ step="create_table_query",
398
+ resource_id=resource_id,
399
+ table_name=table_name,
385
400
  ) from e
386
401
 
387
402
  # this use postgresql COPY from an iterator, it's fast but might be difficult to debug
@@ -395,7 +410,10 @@ async def csv_to_db(
395
410
  )
396
411
  except Exception as e: # I know what I'm doing, pinky swear
397
412
  raise ParseException(
398
- step="copy_records_to_table", resource_id=resource_id, table_name=table_name
413
+ message=str(e),
414
+ step="copy_records_to_table",
415
+ resource_id=resource_id,
416
+ table_name=table_name,
399
417
  ) from e
400
418
  # this inserts rows from iterator one by one, slow but useful for debugging
401
419
  else:
@@ -71,7 +71,11 @@ async def analyse_geojson(
71
71
  timer.mark("geojson-to-pmtiles")
72
72
  except Exception as e:
73
73
  raise ParseException(
74
- step="pmtiles_export", resource_id=resource_id, url=url, check_id=check["id"]
74
+ message=str(e),
75
+ step="pmtiles_export",
76
+ resource_id=resource_id,
77
+ url=url,
78
+ check_id=check["id"],
75
79
  ) from e
76
80
 
77
81
  check = await Check.update(