csv-detective 0.8.1.dev1491__py3-none-any.whl → 0.8.1.dev1509__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- csv_detective/detect_fields/FR/other/code_csp_insee/code_csp_insee.txt +498 -0
- csv_detective/detect_fields/FR/other/csp_insee/csp_insee.txt +571 -0
- csv_detective/detect_fields/FR/other/insee_ape700/insee_ape700.txt +733 -0
- csv_detective/detect_fields/geo/iso_country_code_alpha2/iso_country_code_alpha2.txt +495 -0
- csv_detective/detect_fields/geo/iso_country_code_alpha3/iso_country_code_alpha3.txt +251 -0
- csv_detective/detect_fields/geo/iso_country_code_numeric/iso_country_code_numeric.txt +251 -0
- csv_detective/parsing/columns.py +1 -1
- {csv_detective-0.8.1.dev1491.data → csv_detective-0.8.1.dev1509.data}/data/share/csv_detective/CHANGELOG.md +2 -2
- {csv_detective-0.8.1.dev1491.dist-info → csv_detective-0.8.1.dev1509.dist-info}/METADATA +1 -1
- {csv_detective-0.8.1.dev1491.dist-info → csv_detective-0.8.1.dev1509.dist-info}/RECORD +17 -11
- tests/test_file.py +4 -5
- {csv_detective-0.8.1.dev1491.data → csv_detective-0.8.1.dev1509.data}/data/share/csv_detective/LICENSE +0 -0
- {csv_detective-0.8.1.dev1491.data → csv_detective-0.8.1.dev1509.data}/data/share/csv_detective/README.md +0 -0
- {csv_detective-0.8.1.dev1491.dist-info → csv_detective-0.8.1.dev1509.dist-info}/WHEEL +0 -0
- {csv_detective-0.8.1.dev1491.dist-info → csv_detective-0.8.1.dev1509.dist-info}/entry_points.txt +0 -0
- {csv_detective-0.8.1.dev1491.dist-info → csv_detective-0.8.1.dev1509.dist-info}/licenses/LICENSE +0 -0
- {csv_detective-0.8.1.dev1491.dist-info → csv_detective-0.8.1.dev1509.dist-info}/top_level.txt +0 -0
|
@@ -0,0 +1,251 @@
|
|
|
1
|
+
004
|
|
2
|
+
710
|
|
3
|
+
248
|
|
4
|
+
008
|
|
5
|
+
012
|
|
6
|
+
276
|
|
7
|
+
020
|
|
8
|
+
024
|
|
9
|
+
660
|
|
10
|
+
010
|
|
11
|
+
028
|
|
12
|
+
682
|
|
13
|
+
032
|
|
14
|
+
051
|
|
15
|
+
533
|
|
16
|
+
036
|
|
17
|
+
040
|
|
18
|
+
031
|
|
19
|
+
044
|
|
20
|
+
048
|
|
21
|
+
050
|
|
22
|
+
052
|
|
23
|
+
112
|
|
24
|
+
056
|
|
25
|
+
084
|
|
26
|
+
204
|
|
27
|
+
060
|
|
28
|
+
064
|
|
29
|
+
068
|
|
30
|
+
535
|
|
31
|
+
070
|
|
32
|
+
072
|
|
33
|
+
074
|
|
34
|
+
076
|
|
35
|
+
096
|
|
36
|
+
100
|
|
37
|
+
854
|
|
38
|
+
108
|
|
39
|
+
136
|
|
40
|
+
116
|
|
41
|
+
120
|
|
42
|
+
124
|
|
43
|
+
132
|
|
44
|
+
140
|
|
45
|
+
152
|
|
46
|
+
156
|
|
47
|
+
162
|
|
48
|
+
196
|
|
49
|
+
166
|
|
50
|
+
170
|
|
51
|
+
174
|
|
52
|
+
178
|
|
53
|
+
180
|
|
54
|
+
184
|
|
55
|
+
410
|
|
56
|
+
408
|
|
57
|
+
188
|
|
58
|
+
384
|
|
59
|
+
191
|
|
60
|
+
192
|
|
61
|
+
531
|
|
62
|
+
208
|
|
63
|
+
262
|
|
64
|
+
214
|
|
65
|
+
212
|
|
66
|
+
818
|
|
67
|
+
Gum
|
|
68
|
+
(Ré
|
|
69
|
+
222
|
|
70
|
+
784
|
|
71
|
+
218
|
|
72
|
+
232
|
|
73
|
+
724
|
|
74
|
+
233
|
|
75
|
+
840
|
|
76
|
+
231
|
|
77
|
+
238
|
|
78
|
+
234
|
|
79
|
+
242
|
|
80
|
+
246
|
|
81
|
+
250
|
|
82
|
+
266
|
|
83
|
+
270
|
|
84
|
+
268
|
|
85
|
+
239
|
|
86
|
+
288
|
|
87
|
+
292
|
|
88
|
+
300
|
|
89
|
+
308
|
|
90
|
+
304
|
|
91
|
+
312
|
|
92
|
+
316
|
|
93
|
+
320
|
|
94
|
+
831
|
|
95
|
+
324
|
|
96
|
+
624
|
|
97
|
+
226
|
|
98
|
+
328
|
|
99
|
+
254
|
|
100
|
+
332
|
|
101
|
+
334
|
|
102
|
+
340
|
|
103
|
+
344
|
|
104
|
+
348
|
|
105
|
+
833
|
|
106
|
+
581
|
|
107
|
+
092
|
|
108
|
+
850
|
|
109
|
+
356
|
|
110
|
+
360
|
|
111
|
+
364
|
|
112
|
+
368
|
|
113
|
+
372
|
|
114
|
+
352
|
|
115
|
+
376
|
|
116
|
+
380
|
|
117
|
+
388
|
|
118
|
+
392
|
|
119
|
+
832
|
|
120
|
+
400
|
|
121
|
+
398
|
|
122
|
+
404
|
|
123
|
+
417
|
|
124
|
+
296
|
|
125
|
+
414
|
|
126
|
+
418
|
|
127
|
+
426
|
|
128
|
+
428
|
|
129
|
+
422
|
|
130
|
+
430
|
|
131
|
+
434
|
|
132
|
+
438
|
|
133
|
+
440
|
|
134
|
+
442
|
|
135
|
+
446
|
|
136
|
+
807
|
|
137
|
+
450
|
|
138
|
+
458
|
|
139
|
+
454
|
|
140
|
+
462
|
|
141
|
+
466
|
|
142
|
+
470
|
|
143
|
+
580
|
|
144
|
+
504
|
|
145
|
+
584
|
|
146
|
+
474
|
|
147
|
+
480
|
|
148
|
+
478
|
|
149
|
+
175
|
|
150
|
+
484
|
|
151
|
+
583
|
|
152
|
+
498
|
|
153
|
+
492
|
|
154
|
+
496
|
|
155
|
+
499
|
|
156
|
+
500
|
|
157
|
+
508
|
|
158
|
+
104
|
|
159
|
+
516
|
|
160
|
+
520
|
|
161
|
+
524
|
|
162
|
+
558
|
|
163
|
+
562
|
|
164
|
+
566
|
|
165
|
+
570
|
|
166
|
+
574
|
|
167
|
+
578
|
|
168
|
+
540
|
|
169
|
+
554
|
|
170
|
+
086
|
|
171
|
+
512
|
|
172
|
+
800
|
|
173
|
+
860
|
|
174
|
+
586
|
|
175
|
+
585
|
|
176
|
+
275
|
|
177
|
+
591
|
|
178
|
+
598
|
|
179
|
+
600
|
|
180
|
+
528
|
|
181
|
+
604
|
|
182
|
+
608
|
|
183
|
+
612
|
|
184
|
+
616
|
|
185
|
+
258
|
|
186
|
+
630
|
|
187
|
+
620
|
|
188
|
+
634
|
|
189
|
+
638
|
|
190
|
+
642
|
|
191
|
+
826
|
|
192
|
+
643
|
|
193
|
+
646
|
|
194
|
+
732
|
|
195
|
+
652
|
|
196
|
+
659
|
|
197
|
+
674
|
|
198
|
+
663
|
|
199
|
+
534
|
|
200
|
+
666
|
|
201
|
+
336
|
|
202
|
+
670
|
|
203
|
+
654
|
|
204
|
+
662
|
|
205
|
+
090
|
|
206
|
+
882
|
|
207
|
+
016
|
|
208
|
+
678
|
|
209
|
+
686
|
|
210
|
+
688
|
|
211
|
+
690
|
|
212
|
+
694
|
|
213
|
+
702
|
|
214
|
+
703
|
|
215
|
+
705
|
|
216
|
+
706
|
|
217
|
+
729
|
|
218
|
+
728
|
|
219
|
+
144
|
|
220
|
+
752
|
|
221
|
+
756
|
|
222
|
+
740
|
|
223
|
+
744
|
|
224
|
+
748
|
|
225
|
+
760
|
|
226
|
+
762
|
|
227
|
+
158
|
|
228
|
+
834
|
|
229
|
+
148
|
|
230
|
+
203
|
|
231
|
+
260
|
|
232
|
+
764
|
|
233
|
+
626
|
|
234
|
+
768
|
|
235
|
+
772
|
|
236
|
+
776
|
|
237
|
+
780
|
|
238
|
+
788
|
|
239
|
+
795
|
|
240
|
+
796
|
|
241
|
+
792
|
|
242
|
+
798
|
|
243
|
+
804
|
|
244
|
+
858
|
|
245
|
+
548
|
|
246
|
+
862
|
|
247
|
+
704
|
|
248
|
+
876
|
|
249
|
+
887
|
|
250
|
+
894
|
|
251
|
+
716
|
csv_detective/parsing/columns.py
CHANGED
|
@@ -5,8 +5,8 @@
|
|
|
5
5
|
- Refactor label testing [#119](https://github.com/datagouv/csv-detective/pull/119)
|
|
6
6
|
- Refactor repo metadata and requirements [#120](https://github.com/datagouv/csv-detective/pull/120) [#122](https://github.com/datagouv/csv-detective/pull/122)
|
|
7
7
|
- Better URL detection [#121](https://github.com/datagouv/csv-detective/pull/121)
|
|
8
|
-
- For big files, analyse on sample then validate on whole file [#124](https://github.com/datagouv/csv-detective/pull/124)
|
|
9
|
-
- Fix imports [#125](https://github.com/datagouv/csv-detective/pull/125) [#126](https://github.com/datagouv/csv-detective/pull/126) [#127](https://github.com/datagouv/csv-detective/pull/127)
|
|
8
|
+
- For big files, analyse on sample then validate on whole file [#124](https://github.com/datagouv/csv-detective/pull/124) [#129](https://github.com/datagouv/csv-detective/pull/129)
|
|
9
|
+
- Fix imports [#125](https://github.com/datagouv/csv-detective/pull/125) [#126](https://github.com/datagouv/csv-detective/pull/126) [#127](https://github.com/datagouv/csv-detective/pull/127) [#128](https://github.com/datagouv/csv-detective/pull/128)
|
|
10
10
|
|
|
11
11
|
## 0.8.0 (2025-05-20)
|
|
12
12
|
|
|
@@ -25,12 +25,15 @@ csv_detective/detect_fields/FR/geo/pays/__init__.py,sha256=2q5T4SmCK6ZFF1mrv7d-q
|
|
|
25
25
|
csv_detective/detect_fields/FR/geo/region/__init__.py,sha256=JbFKDd4jAnd9yb7YqP36MoLdO1JFPm1cg60fGXt6ZvI,1074
|
|
26
26
|
csv_detective/detect_fields/FR/other/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
27
27
|
csv_detective/detect_fields/FR/other/code_csp_insee/__init__.py,sha256=SRWJvg3Ikyjmop9iL14igTjxNGpO-QB3fpADI_bLYEY,566
|
|
28
|
+
csv_detective/detect_fields/FR/other/code_csp_insee/code_csp_insee.txt,sha256=rbcjtMP6qTZ7BTU6ZegkiXKCruqY_m9Ep6ZgRabFS_E,2486
|
|
28
29
|
csv_detective/detect_fields/FR/other/code_import/__init__.py,sha256=zJ9YfPa5p--uHNQFeO1gTjxDy2Um_r-MxQd29VBNjFw,243
|
|
29
30
|
csv_detective/detect_fields/FR/other/code_rna/__init__.py,sha256=Z0RjMBt1--ZL7Jd1RsHAQCCbTAQk_BnlnTq8VF1o_VA,146
|
|
30
31
|
csv_detective/detect_fields/FR/other/code_waldec/__init__.py,sha256=41SYNzCzUFh4trQlwG-9UC0-1Wi4fTcv8Byi_dd9Lq4,168
|
|
31
32
|
csv_detective/detect_fields/FR/other/csp_insee/__init__.py,sha256=lvcaVKgOPrCaZb-Y1-wYCbLYB_CQjCJFNAzfWDwtTVE,496
|
|
33
|
+
csv_detective/detect_fields/FR/other/csp_insee/csp_insee.txt,sha256=kgKaKc-5PHu5U4--ugLjpFyMNtTU9CGdZ9ANU3YAsM4,32879
|
|
32
34
|
csv_detective/detect_fields/FR/other/date_fr/__init__.py,sha256=kMV52djlG0y4o0ELEZuvTv_FvooYOgTnV1aWhycFJDc,284
|
|
33
35
|
csv_detective/detect_fields/FR/other/insee_ape700/__init__.py,sha256=g8pOqJPKVpQiMd78zgrjXJWYeWkYhu8r3D4IQX519HQ,519
|
|
36
|
+
csv_detective/detect_fields/FR/other/insee_ape700/insee_ape700.txt,sha256=nKgslakENwgE7sPkVNHqR23iXuxF02p9-v5MC2_ntx8,4398
|
|
34
37
|
csv_detective/detect_fields/FR/other/sexe/__init__.py,sha256=iYkLe3MM51GWyBX_4BTq5PWDX_EeYRbEHWKMr8oE1MQ,269
|
|
35
38
|
csv_detective/detect_fields/FR/other/siren/__init__.py,sha256=ohSwUL2rXqTXPG5WDAh2SP-lp1SzFCYgo4IhJ-PXmdk,442
|
|
36
39
|
csv_detective/detect_fields/FR/other/siret/__init__.py,sha256=ThEeT6rXmS0EvHW8y4A_74bILyErDGxLe9v3elHOFs8,707
|
|
@@ -41,8 +44,11 @@ csv_detective/detect_fields/FR/temp/jour_de_la_semaine/__init__.py,sha256=TRJxFS
|
|
|
41
44
|
csv_detective/detect_fields/FR/temp/mois_de_annee/__init__.py,sha256=GuOnGw39Kz82bXId8mNzmlC4YkOrrf_F7f4g4uW_uvY,581
|
|
42
45
|
csv_detective/detect_fields/geo/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
43
46
|
csv_detective/detect_fields/geo/iso_country_code_alpha2/__init__.py,sha256=gbuzf_9yytZnmYYABk7vK3WinSU_AnrSxRpNQ7xroa8,433
|
|
47
|
+
csv_detective/detect_fields/geo/iso_country_code_alpha2/iso_country_code_alpha2.txt,sha256=YyPlDqCdz65ecf4Wes_r0P4rDSJG35niXtjc4MmctXM,1740
|
|
44
48
|
csv_detective/detect_fields/geo/iso_country_code_alpha3/__init__.py,sha256=u98rn_wuAGlGh2wN-t5syLBlCkqcxCAjpbvbBN8tov8,409
|
|
49
|
+
csv_detective/detect_fields/geo/iso_country_code_alpha3/iso_country_code_alpha3.txt,sha256=aYqKSohgXuBtcIBfF52f8JWYDdxL_HV_Ol1srGnWBp4,1003
|
|
45
50
|
csv_detective/detect_fields/geo/iso_country_code_numeric/__init__.py,sha256=wJAynAkGZN7jKeI3xOeLXQ_irxQBb_J56pRkLDYVClY,436
|
|
51
|
+
csv_detective/detect_fields/geo/iso_country_code_numeric/iso_country_code_numeric.txt,sha256=2GtEhuporsHYV-pU4q9kfXU5iOtfW5C0GYBTTKQtnnA,1004
|
|
46
52
|
csv_detective/detect_fields/geo/json_geojson/__init__.py,sha256=FPHOfTrfXJs62-NgeOcNGOvwPd7I1fEVp8lTdMNfj3w,433
|
|
47
53
|
csv_detective/detect_fields/geo/latitude_wgs/__init__.py,sha256=ArS6PuYEd0atZwSqNDZhXZz1TwzdiwdV8ovRYTOacpg,327
|
|
48
54
|
csv_detective/detect_fields/geo/latlon_wgs/__init__.py,sha256=7_mnO9uC_kI7e2WR8xIer7Kqw8zi-v-JKaAD4zcoGbE,342
|
|
@@ -137,25 +143,25 @@ csv_detective/output/profile.py,sha256=B8YU541T_YPDezJGh4dkHckOShiwHSrZd9GS8jbmz
|
|
|
137
143
|
csv_detective/output/schema.py,sha256=ZDBWDOD8IYp7rcB0_n8l9JXGIhOQ6bTZHFWfTmnNNEQ,13480
|
|
138
144
|
csv_detective/output/utils.py,sha256=HbmvCCCmFo7NJxhD_UsJIveuw-rrfhrvYckv1CJn_10,2301
|
|
139
145
|
csv_detective/parsing/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
140
|
-
csv_detective/parsing/columns.py,sha256=
|
|
146
|
+
csv_detective/parsing/columns.py,sha256=VzgG9Nwph5C_fLW_TuQC5BZVlPmOyjrH7Plvm_c8kWc,5675
|
|
141
147
|
csv_detective/parsing/compression.py,sha256=Fnw5tj-PpBNI8NYsWj5gD-DUoWcVLnsVpiKm9MpxmIA,350
|
|
142
148
|
csv_detective/parsing/csv.py,sha256=11mibDnJhIjykXLGZvA5ZEU5U7KgxIrbyO6BNv6jlro,1626
|
|
143
149
|
csv_detective/parsing/excel.py,sha256=AslE2S1e67o8yTIAIhp-lAnJ6-XqeBBRz1-VMFqhZBM,7055
|
|
144
150
|
csv_detective/parsing/load.py,sha256=u6fbGFZsL2GwPQRzhAXgt32JpUur7vbQdErREHxNJ-w,3661
|
|
145
151
|
csv_detective/parsing/text.py,sha256=_TprGi0gHZlRsafizI3dqQhBehZW4BazqxmypMcAZ-o,1824
|
|
146
|
-
csv_detective-0.8.1.
|
|
147
|
-
csv_detective-0.8.1.
|
|
148
|
-
csv_detective-0.8.1.
|
|
149
|
-
csv_detective-0.8.1.
|
|
152
|
+
csv_detective-0.8.1.dev1509.data/data/share/csv_detective/CHANGELOG.md,sha256=em97ZkXiZcpRQnOj7zCgZRtGL6sbaQvyPN6C1UvT4Dk,9034
|
|
153
|
+
csv_detective-0.8.1.dev1509.data/data/share/csv_detective/LICENSE,sha256=A1dQrzxyxRHRih02KwibWj1khQyF7GeA6SqdOU87Gk4,1088
|
|
154
|
+
csv_detective-0.8.1.dev1509.data/data/share/csv_detective/README.md,sha256=gKLFmC8kuCCywS9eAhMak_JNriUWWNOsBKleAu5TIEY,8501
|
|
155
|
+
csv_detective-0.8.1.dev1509.dist-info/licenses/LICENSE,sha256=A1dQrzxyxRHRih02KwibWj1khQyF7GeA6SqdOU87Gk4,1088
|
|
150
156
|
tests/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
151
157
|
tests/test_example.py,sha256=JeHxSK0IVDcSrOhSZlNGSQv4JAc_r6mzvJM8PfmLTMw,2018
|
|
152
158
|
tests/test_fields.py,sha256=d2tNvjtal6ZbO646x1GDbp_CGgp-EIcdg2SgMG72J6E,10270
|
|
153
|
-
tests/test_file.py,sha256=
|
|
159
|
+
tests/test_file.py,sha256=0bHV9wx9mSRoav_DVF19g694yohb1p0bw7rtcBeKG-8,8451
|
|
154
160
|
tests/test_labels.py,sha256=Nkr645bUewrj8hjNDKr67FQ6Sy_TID6f3E5Kfkl231M,464
|
|
155
161
|
tests/test_structure.py,sha256=bv-tjgXohvQAxwmxzH0BynFpK2TyPjcxvtIAmIRlZmA,1393
|
|
156
162
|
tests/test_validation.py,sha256=CTGonR6htxcWF9WH8MxumDD8cF45Y-G4hm94SM4lFjU,3246
|
|
157
|
-
csv_detective-0.8.1.
|
|
158
|
-
csv_detective-0.8.1.
|
|
159
|
-
csv_detective-0.8.1.
|
|
160
|
-
csv_detective-0.8.1.
|
|
161
|
-
csv_detective-0.8.1.
|
|
163
|
+
csv_detective-0.8.1.dev1509.dist-info/METADATA,sha256=V_xchinM2b_RyUVCxSmEB4UA66Q0IdIjkMfSi2bwf6E,10443
|
|
164
|
+
csv_detective-0.8.1.dev1509.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
165
|
+
csv_detective-0.8.1.dev1509.dist-info/entry_points.txt,sha256=JjweTReFqKJmuvkegzlew2j3D5pZzfxvbEGOtGVGmaY,56
|
|
166
|
+
csv_detective-0.8.1.dev1509.dist-info/top_level.txt,sha256=M0Nv646VHo-49zWjPkwo2C48UmtfddV8_9mEZeIxy8Q,20
|
|
167
|
+
csv_detective-0.8.1.dev1509.dist-info/RECORD,,
|
tests/test_file.py
CHANGED
|
@@ -7,12 +7,11 @@ from csv_detective import routine
|
|
|
7
7
|
|
|
8
8
|
|
|
9
9
|
@pytest.mark.parametrize(
|
|
10
|
-
"
|
|
11
|
-
(
|
|
10
|
+
"max_rows_analysis",
|
|
11
|
+
(100, int(1e5)),
|
|
12
12
|
)
|
|
13
|
-
def test_columns_output_on_file(
|
|
14
|
-
|
|
15
|
-
with patch("csv_detective.detection.formats.MAX_ROWS_ANALYSIS", patched):
|
|
13
|
+
def test_columns_output_on_file(max_rows_analysis):
|
|
14
|
+
with patch("csv_detective.detection.formats.MAX_ROWS_ANALYSIS", max_rows_analysis):
|
|
16
15
|
output = routine(
|
|
17
16
|
file_path="tests/data/a_test_file.csv",
|
|
18
17
|
num_rows=-1,
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{csv_detective-0.8.1.dev1491.dist-info → csv_detective-0.8.1.dev1509.dist-info}/entry_points.txt
RENAMED
|
File without changes
|
{csv_detective-0.8.1.dev1491.dist-info → csv_detective-0.8.1.dev1509.dist-info}/licenses/LICENSE
RENAMED
|
File without changes
|
{csv_detective-0.8.1.dev1491.dist-info → csv_detective-0.8.1.dev1509.dist-info}/top_level.txt
RENAMED
|
File without changes
|