data-designer 0.3.8__py3-none-any.whl → 0.3.8rc2__py3-none-any.whl

This diff shows the differences between the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between the package versions as they appear in their respective public registries.
data_designer/_version.py CHANGED
@@ -28,7 +28,7 @@ version_tuple: VERSION_TUPLE
28
28
  commit_id: COMMIT_ID
29
29
  __commit_id__: COMMIT_ID
30
30
 
31
- __version__ = version = '0.3.8'
32
- __version_tuple__ = version_tuple = (0, 3, 8)
31
+ __version__ = version = '0.3.8rc2'
32
+ __version_tuple__ = version_tuple = (0, 3, 8, 'rc2')
33
33
 
34
34
  __commit_id__ = commit_id = None
@@ -353,11 +353,9 @@ PREDEFINED_PROVIDERS_MODEL_MAP = {
353
353
  NEMOTRON_PERSONAS_DATASET_SIZES = {
354
354
  "en_US": "1.24 GB",
355
355
  "en_IN": "2.39 GB",
356
- "en_SG": "0.30 GB",
357
356
  "hi_Deva_IN": "4.14 GB",
358
357
  "hi_Latn_IN": "2.7 GB",
359
358
  "ja_JP": "1.69 GB",
360
- "pt_BR": "2.33 GB",
361
359
  }
362
360
 
363
361
  LOCALES_WITH_MANAGED_DATASETS = list[str](NEMOTRON_PERSONAS_DATASET_SIZES.keys())
@@ -40,16 +40,13 @@ PII_FIELDS = [
40
40
  "state",
41
41
  "email_address",
42
42
  "phone_number",
43
- # Brazil-specific fields
44
- "race",
45
43
  # Japan-specific fields
46
44
  "area",
47
45
  "prefecture",
48
46
  "zone",
49
- # Brazil and India shared fields
50
- "religion",
51
47
  # India-specific fields
52
48
  "district",
49
+ "religion",
53
50
  "education_degree",
54
51
  "first_language",
55
52
  "second_language",
@@ -81,10 +78,9 @@ PERSONA_FIELDS = [
81
78
  # Japan-specific persona fields
82
79
  "aspects",
83
80
  "digital_skills",
84
- # Brazil and India shared persona fields
85
- "religious_persona",
86
- "religious_background",
87
81
  # India-specific persona fields
88
82
  "linguistic_persona",
83
+ "religious_persona",
89
84
  "linguistic_background",
85
+ "religious_background",
90
86
  ]
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: data-designer
3
- Version: 0.3.8
3
+ Version: 0.3.8rc2
4
4
  Summary: General framework for synthetic data generation
5
5
  License-Expression: Apache-2.0
6
6
  License-File: LICENSE
@@ -1,5 +1,5 @@
1
1
  data_designer/__init__.py,sha256=iLr6FpW41-DFbGexuXCJ6gN1xBMNUZ2jfj9XxySmQhk,502
2
- data_designer/_version.py,sha256=iWEYFk8Ve-UDYmpiH5KfwfwhQTYtkxZlaGPwKE2xDy0,704
2
+ data_designer/_version.py,sha256=wP4Vt8OKUu98a4RThXFwdZlfYV_E8tf8D24DFaCFjqg,714
3
3
  data_designer/errors.py,sha256=r1pBvmvRBAsPmb7oF_veubhkxZ2uPo9cGEDwykLziX4,220
4
4
  data_designer/lazy_heavy_imports.py,sha256=wULSEPQRUOZXvOnb0tdf6wNbRBpaaczYfAjY-pstCBM,1512
5
5
  data_designer/logging.py,sha256=gRi9BOqm95UC1-u4pn6n-G4EySy9HhwKVyKLRO4aqm4,5382
@@ -63,7 +63,7 @@ data_designer/config/analysis/dataset_profiler.py,sha256=-5eX55IXivwUBMg2pI-d_3e
63
63
  data_designer/config/analysis/utils/errors.py,sha256=pvmdQ_YuIlWW4NFw-cX_rOoQf-GG8y_FiQzNctB__DQ,331
64
64
  data_designer/config/analysis/utils/reporting.py,sha256=teTzd1OHtpI4vbIinGOGsKXyNldO3F5eqbNdAztF0_s,7066
65
65
  data_designer/config/utils/code_lang.py,sha256=EqMJh1GL5ysUZIoyqx_6vmqenUKHm4J-RQtKXiA4EPg,2354
66
- data_designer/config/utils/constants.py,sha256=eqDQ57b8B0v5qRSO0He45LEjSxtfxlsPtHRvBu1xkw0,8973
66
+ data_designer/config/utils/constants.py,sha256=KU4ZCIe18gXdBp2N_BgZlRW90FIqjFPYmJtqgVY3Ink,8925
67
67
  data_designer/config/utils/errors.py,sha256=HCjer0YrF0bMn5j8gmgWaLb0395LAr_hxMD1ftOsOc8,520
68
68
  data_designer/config/utils/info.py,sha256=yOa4U8kI_CY4OfCKZxCm2okU8klAiThvyjKM5tG-F0A,3469
69
69
  data_designer/config/utils/io_helpers.py,sha256=kzvOR7QgqijkqU-O2enIlpCWwHvzc3oRaEl4Lsjh1Do,8466
@@ -164,7 +164,7 @@ data_designer/engine/sampling_gen/data_sources/base.py,sha256=zUG5XTplD5pgHh4ytC
164
164
  data_designer/engine/sampling_gen/data_sources/errors.py,sha256=_9rbwUpaz0Pd2Ods4AVDQ7Uq4JvPyfHhTp51BdtJDto,367
165
165
  data_designer/engine/sampling_gen/data_sources/sources.py,sha256=53KVPp7REjNKA0rajGmT_tBkxwQqwrcIKhcijBGcfcs,13647
166
166
  data_designer/engine/sampling_gen/entities/__init__.py,sha256=XLO09Ei8g0lU7hYlzKCvhvQhLFBe5CBwE4v2PqK9xWY,142
167
- data_designer/engine/sampling_gen/entities/dataset_based_person_fields.py,sha256=r8qXWe8EquJognihPNGzma4fFuSQAAZHlkYVsGmcX2w,2006
167
+ data_designer/engine/sampling_gen/entities/dataset_based_person_fields.py,sha256=0_eUTtrWFGxTfTfqlz9ig9bJEtYeckb50J7w5LhYTr8,1883
168
168
  data_designer/engine/sampling_gen/entities/email_address_utils.py,sha256=THfD7muq5tMHkRWOATN-N3iSFgkKjT4e8hKquDFMTlU,5272
169
169
  data_designer/engine/sampling_gen/entities/errors.py,sha256=SbtwwG6JgoY4k6pq2-y-lD60nX_pqjf5QftmwgXt0us,352
170
170
  data_designer/engine/sampling_gen/entities/national_id_utils.py,sha256=XUFB6RhfLGFQUNyy0B6BSgtrG9NdEnIjfSALBwJplho,2652
@@ -189,8 +189,8 @@ data_designer/plugins/registry.py,sha256=Cnt33Q25o9bS2v2YDbV3QPM57VNrtIBKAb4ERQR
189
189
  data_designer/plugins/testing/__init__.py,sha256=yyxrrH_i3q0Xb56QO9Ma35WtHlQ5PJF1b2pQoKa16xU,296
190
190
  data_designer/plugins/testing/stubs.py,sha256=9tUF209ayZR6f0Q1LsRDW4kEOTgPoIxV8jlq4QoWuW0,3498
191
191
  data_designer/plugins/testing/utils.py,sha256=a9LEgK827cnIzHEkgXOdgywrKDLBE36cyttrpG1ctT4,973
192
- data_designer-0.3.8.dist-info/METADATA,sha256=n9jXs34c2_rOL-Tme5Y6xrb4fMo0-GNNEVHlCl5WfLY,8119
193
- data_designer-0.3.8.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
194
- data_designer-0.3.8.dist-info/entry_points.txt,sha256=NWWWidyDxN6CYX6y664PhBYMhbaYTQTyprqfYAgkyCg,57
195
- data_designer-0.3.8.dist-info/licenses/LICENSE,sha256=cSWJDwVqHyQgly8Zmt3pqXJ2eQbZVYwN9qd0NMssxXY,11336
196
- data_designer-0.3.8.dist-info/RECORD,,
192
+ data_designer-0.3.8rc2.dist-info/METADATA,sha256=-gMHOKpWpc0HRy8QfQb4KQkEqeYJaHbxlL_l9M1PKmk,8122
193
+ data_designer-0.3.8rc2.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
194
+ data_designer-0.3.8rc2.dist-info/entry_points.txt,sha256=NWWWidyDxN6CYX6y664PhBYMhbaYTQTyprqfYAgkyCg,57
195
+ data_designer-0.3.8rc2.dist-info/licenses/LICENSE,sha256=cSWJDwVqHyQgly8Zmt3pqXJ2eQbZVYwN9qd0NMssxXY,11336
196
+ data_designer-0.3.8rc2.dist-info/RECORD,,