data_drain 0.3.1 → 0.3.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +6 -0
- data/lib/data_drain/engine.rb +2 -2
- data/lib/data_drain/file_ingestor.rb +1 -1
- data/lib/data_drain/version.rb +1 -1
- metadata +3 -3
- /data/docs/execution/{v0.3.1-OBSERVACIONES.md → archive/v0.3.1-OBSERVACIONES.md} +0 -0
- /data/docs/execution/{v0.3.1.md → archive/v0.3.1.md} +0 -0
checksums.yaml
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
---
|
|
2
2
|
SHA256:
|
|
3
|
-
metadata.gz:
|
|
4
|
-
data.tar.gz:
|
|
3
|
+
metadata.gz: 6e7253dc94b9b7e2d000ba0c03b4e4d7692f12a26f16b422e71a884fa7a81efa
|
|
4
|
+
data.tar.gz: c1f9f7eb1e0e861c7d2e0dbf6ba6c66125a97bcbd90e175aa1a859e8c5a898fa
|
|
5
5
|
SHA512:
|
|
6
|
-
metadata.gz:
|
|
7
|
-
data.tar.gz:
|
|
6
|
+
metadata.gz: fdbf3431159bc83950adf972d68d8cff245bffa14481e0e2ef039a7959e3cbf884649c5bbaf40219a66a7ff0a8b24cad428001e5a7e05071873899bed3969b57
|
|
7
|
+
data.tar.gz: 3f5acffe028c91b472dd5de9b4e03f34954ca8c8cffeeb3e1f3f3b725b14a8f7df449ebc4b6cf6d7728a2a935f579ba403f2e72bfb53a6aadde1ca281c2698b2
|
data/CHANGELOG.md
CHANGED
|
@@ -1,5 +1,11 @@
|
|
|
1
1
|
## [Unreleased]
|
|
2
2
|
|
|
3
|
+
## [0.3.2] - 2026-04-15
|
|
4
|
+
|
|
5
|
+
### Corrección de regresión (desde v0.3.1)
|
|
6
|
+
|
|
7
|
+
- El cambio `COUNT(*)` → `count()` (ítem 16 de v0.3.1) era incorrecto: `count()` sin argumentos es SQL inválido en Postgres. Se revierte a `COUNT(*)` en `Engine#get_postgres_count`, `Engine#verify_integrity` y `FileIngestor#step_count_source`. Ver [#10](https://github.com/gedera/data_drain/pull/10).
|
|
8
|
+
|
|
3
9
|
## [0.3.1] - 2026-04-15
|
|
4
10
|
|
|
5
11
|
### BREAKING (preventivo)
|
data/lib/data_drain/engine.rb
CHANGED
|
@@ -159,7 +159,7 @@ module DataDrain
|
|
|
159
159
|
# @api private
|
|
160
160
|
# @return [Integer]
|
|
161
161
|
def get_postgres_count
|
|
162
|
-
pg_sql = "SELECT
|
|
162
|
+
pg_sql = "SELECT COUNT(*) AS row_count FROM public.#{@table_name} WHERE #{base_where_sql}"
|
|
163
163
|
pg_sql = pg_sql.gsub("'", "''")
|
|
164
164
|
query = "SELECT row_count FROM postgres_query('pg_source', '#{pg_sql}')"
|
|
165
165
|
@duckdb.query(query).first.first
|
|
@@ -204,7 +204,7 @@ module DataDrain
|
|
|
204
204
|
|
|
205
205
|
begin
|
|
206
206
|
query = <<~SQL
|
|
207
|
-
SELECT
|
|
207
|
+
SELECT COUNT(*)
|
|
208
208
|
FROM read_parquet('#{archive_path}')
|
|
209
209
|
WHERE #{base_where_sql}
|
|
210
210
|
SQL
|
|
data/lib/data_drain/file_ingestor.rb
CHANGED
|
@@ -82,7 +82,7 @@ module DataDrain
|
|
|
82
82
|
|
|
83
83
|
# @api private
|
|
84
84
|
def step_count_source
|
|
85
|
-
source_count = timed(:source_query) { @duckdb.query("SELECT
|
|
85
|
+
source_count = timed(:source_query) { @duckdb.query("SELECT COUNT(*) FROM #{@reader_function}").first.first }
|
|
86
86
|
safe_log(:info, "file_ingestor.count", {
|
|
87
87
|
source_path: @source_path,
|
|
88
88
|
count: source_count,
|
data/lib/data_drain/version.rb
CHANGED
metadata
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
|
2
2
|
name: data_drain
|
|
3
3
|
version: !ruby/object:Gem::Version
|
|
4
|
-
version: 0.3.1
|
|
4
|
+
version: 0.3.2
|
|
5
5
|
platform: ruby
|
|
6
6
|
authors:
|
|
7
7
|
- Gabriel
|
|
@@ -102,9 +102,9 @@ files:
|
|
|
102
102
|
- docs/execution/archive/v0.2.0.md
|
|
103
103
|
- docs/execution/archive/v0.3.0-OBSERVACIONES.md
|
|
104
104
|
- docs/execution/archive/v0.3.0.md
|
|
105
|
+
- docs/execution/archive/v0.3.1-OBSERVACIONES.md
|
|
106
|
+
- docs/execution/archive/v0.3.1.md
|
|
105
107
|
- docs/execution/v0.2.2.md
|
|
106
|
-
- docs/execution/v0.3.1-OBSERVACIONES.md
|
|
107
|
-
- docs/execution/v0.3.1.md
|
|
108
108
|
- docs/glue_pyspark_example.py
|
|
109
109
|
- lib/data_drain.rb
|
|
110
110
|
- lib/data_drain/configuration.rb
|
|
File without changes
|
|
File without changes
|