additory 0.1.0a1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (87) hide show
  1. additory/__init__.py +15 -0
  2. additory/analysis/__init__.py +48 -0
  3. additory/analysis/cardinality.py +126 -0
  4. additory/analysis/correlations.py +124 -0
  5. additory/analysis/distributions.py +376 -0
  6. additory/analysis/quality.py +158 -0
  7. additory/analysis/scan.py +400 -0
  8. additory/augment/__init__.py +24 -0
  9. additory/augment/augmentor.py +653 -0
  10. additory/augment/builtin_lists.py +430 -0
  11. additory/augment/distributions.py +22 -0
  12. additory/augment/forecast.py +1132 -0
  13. additory/augment/list_registry.py +177 -0
  14. additory/augment/smote.py +320 -0
  15. additory/augment/strategies.py +883 -0
  16. additory/common/__init__.py +157 -0
  17. additory/common/backend.py +355 -0
  18. additory/common/column_utils.py +191 -0
  19. additory/common/distributions.py +737 -0
  20. additory/common/exceptions.py +62 -0
  21. additory/common/lists.py +229 -0
  22. additory/common/patterns.py +240 -0
  23. additory/common/resolver.py +567 -0
  24. additory/common/sample_data.py +182 -0
  25. additory/common/validation.py +197 -0
  26. additory/core/__init__.py +27 -0
  27. additory/core/ast_builder.py +165 -0
  28. additory/core/backends/__init__.py +23 -0
  29. additory/core/backends/arrow_bridge.py +476 -0
  30. additory/core/backends/cudf_bridge.py +355 -0
  31. additory/core/column_positioning.py +358 -0
  32. additory/core/compiler_polars.py +166 -0
  33. additory/core/config.py +342 -0
  34. additory/core/enhanced_cache_manager.py +1119 -0
  35. additory/core/enhanced_matchers.py +473 -0
  36. additory/core/enhanced_version_manager.py +325 -0
  37. additory/core/executor.py +59 -0
  38. additory/core/integrity_manager.py +477 -0
  39. additory/core/loader.py +190 -0
  40. additory/core/logging.py +24 -0
  41. additory/core/memory_manager.py +547 -0
  42. additory/core/namespace_manager.py +657 -0
  43. additory/core/parser.py +176 -0
  44. additory/core/polars_expression_engine.py +551 -0
  45. additory/core/registry.py +176 -0
  46. additory/core/sample_data_manager.py +492 -0
  47. additory/core/user_namespace.py +751 -0
  48. additory/core/validator.py +27 -0
  49. additory/dynamic_api.py +308 -0
  50. additory/expressions/__init__.py +26 -0
  51. additory/expressions/engine.py +551 -0
  52. additory/expressions/parser.py +176 -0
  53. additory/expressions/proxy.py +546 -0
  54. additory/expressions/registry.py +313 -0
  55. additory/expressions/samples.py +492 -0
  56. additory/synthetic/__init__.py +101 -0
  57. additory/synthetic/api.py +220 -0
  58. additory/synthetic/common_integration.py +314 -0
  59. additory/synthetic/config.py +262 -0
  60. additory/synthetic/engines.py +529 -0
  61. additory/synthetic/exceptions.py +180 -0
  62. additory/synthetic/file_managers.py +518 -0
  63. additory/synthetic/generator.py +702 -0
  64. additory/synthetic/generator_parser.py +68 -0
  65. additory/synthetic/integration.py +319 -0
  66. additory/synthetic/models.py +241 -0
  67. additory/synthetic/pattern_resolver.py +573 -0
  68. additory/synthetic/performance.py +469 -0
  69. additory/synthetic/polars_integration.py +464 -0
  70. additory/synthetic/proxy.py +60 -0
  71. additory/synthetic/schema_parser.py +685 -0
  72. additory/synthetic/validator.py +553 -0
  73. additory/utilities/__init__.py +53 -0
  74. additory/utilities/encoding.py +600 -0
  75. additory/utilities/games.py +300 -0
  76. additory/utilities/keys.py +8 -0
  77. additory/utilities/lookup.py +103 -0
  78. additory/utilities/matchers.py +216 -0
  79. additory/utilities/resolvers.py +286 -0
  80. additory/utilities/settings.py +167 -0
  81. additory/utilities/units.py +746 -0
  82. additory/utilities/validators.py +153 -0
  83. additory-0.1.0a1.dist-info/METADATA +293 -0
  84. additory-0.1.0a1.dist-info/RECORD +87 -0
  85. additory-0.1.0a1.dist-info/WHEEL +5 -0
  86. additory-0.1.0a1.dist-info/licenses/LICENSE +21 -0
  87. additory-0.1.0a1.dist-info/top_level.txt +1 -0
@@ -0,0 +1,430 @@
1
+ """
2
+ Built-in Lists Registry for Data Augmentation
3
+
4
+ Provides globally available lists for choice-based augmentation strategies.
5
+ These lists are loaded in memory for instant access (O(1) lookup, zero I/O).
6
+
7
+ Users can override any list using add.register_list("list_name", [...])
8
+
9
+ List Resolution Order:
10
+ 1. User-registered lists (highest priority)
11
+ 2. Built-in lists (this module)
12
+ 3. Error if not found
13
+ """
14
+
15
+ # =============================================================================
16
+ # NAMES - Globally diverse names representing major world regions
17
+ # =============================================================================
18
+
19
# Given names used by choice-based augmentation strategies.
# Every entry appears exactly once so that a uniform random choice over the
# list gives each name the same weight. Names that were previously repeated
# in a later regional group ("Fatima", "Ayesha", "Jose", "William") are kept
# only at their first occurrence.
FIRST_NAMES = [
    # India & South Asia
    "Arjun", "Vikram", "Samuel", "Harpreet", "Kabir", "Aarav", "Aadhya",
    "Fatima", "Anita", "Zoya", "Meera", "Nisha", "Ayesha", "Ritika", "Ira",
    "Dev", "Karan", "Rhea", "Tanvi", "Varun", "Neha", "Ishaan", "Tara",
    "Aditya", "Kavya", "Suresh", "Priya", "Manish", "Shreya", "Naveen",
    "Diya", "Rohit", "Ananya", "Kunal", "Pooja", "Raj", "Sneha", "Suraj",
    "Lavanya", "Gaurav", "Shalini", "Mohan", "Vandana", "Karthik", "Bhavana",
    "Raghav", "Simran", "Tejas", "Anjali", "Nitin", "Radhika", "Abhishek",
    "Shweta", "Parth", "Ishita", "Siddharth", "Malini", "Vivek", "Yamini",
    "Pranav", "Aarti", "Rajesh", "Komal", "Sanjay", "Madhuri", "Deepak",
    "Sonali", "Hemant", "Kirti", "Ashok", "Rupa", "Jatin", "Leela", "Vinay",
    "Charu", "Harish", "Nandini", "Shankar", "Pallavi", "Arvind", "Kusum",
    "Manoj", "Gayatri", "Sagar", "Ritu", "Bharat", "Chitra", "Keshav", "Lata",
    "Om", "Padma", "Yash", "Seema", "Kartik", "Madhav", "Veena", "Rohan",
    "Amar", "Abdul", "Antony",
    # Americas & Europe
    "James", "Mary", "Robert", "Oliver", "Olivia", "George",
    # East Asia
    "Wei", "Mei", "Jun", "Haruto", "Yui", "Ren", "Min-jun", "Seo-yeon", "Ji-ho",
    # Europe
    "Gabriel", "Emma", "Louis", "Noah", "Emilia", "Leon", "Hugo", "Lucia",
    "Mateo", "Leonardo", "Sofia", "Francesco", "Miguel", "Helena", "Arthur",
    "Santiago", "Maria", "Jose", "Liam", "Charlotte", "William", "Alexander",
    "Dmitry", "Mia", "Ethan",
    # Africa
    "Chinedu", "Aisha", "Oluwaseun",
    # Middle East ("Fatima" is already listed above)
    "Mohamed", "Ahmed", "Yusuf", "Elif", "Mustafa", "Abdullah",
    "Omar", "Mariam",
    # Southeast Asia ("Jose" and "Ayesha" are already listed above)
    "Putra", "Siti", "Agus", "Juan", "Angel", "Rahim",
    "Karim", "Anh", "Linh", "Minh", "Niran", "Mali", "Arun",
    # Additional ("William" is already listed above)
    "Chloe", "Jayden", "Saif", "Khalid", "Daan", "Sem", "Lucas", "Alice",
    "Jakob", "Nora", "Emil", "Oscar", "Alma", "Jack", "Aoife",
    "Conor", "Leo", "Isla",
]
57
+
58
+ LAST_NAMES = [
59
+ # India & South Asia
60
+ "Rao", "Sharma", "Gupta", "Kumar", "Reddy", "Iyer", "Nair", "Pillai",
61
+ "Shetty", "Gowda", "Verma", "Yadav", "Chauhan", "Thakur", "Jha", "Tiwari",
62
+ "Mishra", "Pandey", "Shukla", "Saxena", "Bhat", "Naidu", "Kulkarni",
63
+ "Deshmukh", "Patil", "Joshi", "Shinde", "Gaikwad", "Salvi", "Khatri",
64
+ "Kapoor", "Khanna", "Mehta", "Shah", "Soni", "Modi", "Jain", "Agarwal",
65
+ "Bansal", "Mahajan", "Chawla", "Sethi", "Malhotra", "Anand", "Chopra",
66
+ "Gill", "Sandhu", "Sidhu", "Ahluwalia", "Bajwa", "Rawat", "Negi", "Bisht",
67
+ "Rana", "Sinha", "Bose", "Roy", "Dutta", "Mukherjee", "Sengupta",
68
+ "Chakraborty", "Basu", "Deb", "Paul", "Sen", "Konar", "Mondal", "Pal",
69
+ "Saha", "Halder", "Barik", "Behera", "Pradhan", "Swain", "Mohanty", "Raut",
70
+ "Jadhav", "Pawar", "Kamble", "More", "Wagh", "Lokhande", "Bendre", "Naik",
71
+ "Hegde", "Babu", "Varma", "Menon", "Cherian", "Kurian", "Thomas", "Mathew",
72
+ "George", "Abraham", "Philip", "Sunny", "Chacko", "Joseph", "Antony",
73
+ # Americas, Europe & East Asia
74
+ "Smith", "Johnson", "Williams", "Jones", "Taylor", "Wang", "Chen", "Zhao",
75
+ "Sato", "Suzuki", "Takahashi", "Kim", "Lee", "Park", "Martin", "Bernard",
76
+ "Dubois", "Muller", "Schmidt", "Schneider", "Garcia", "Fernandez", "Lopez",
77
+ "Rossi", "Russo", "Ferrari", "Silva", "Santos", "Oliveira", "Hernandez",
78
+ "Martinez", "Brown", "Tremblay", "Ivanov", "Smirnov", "Kuznetsov",
79
+ # Africa
80
+ "Nkosi", "Botha", "Dlamini", "Okafor", "Ibrahim", "Adeyemi",
81
+ # Middle East
82
+ "Hassan", "Ali", "Youssef", "Yilmaz", "Kaya", "Demir", "Al-Saud",
83
+ "Al-Harbi", "Al-Qahtani",
84
+ # Southeast Asia, followed by additional South Asian, Gulf, Dutch, Nordic, and Irish surnames
85
+ "Pratama", "Wijaya", "Saputra", "Dela Cruz", "Reyes", "Khan", "Malik",
86
+ "Chowdhury", "Islam", "Rahman", "Ahmed", "Nguyen", "Tran", "Le", "Saetang",
87
+ "Boonmee", "Chaiyaporn", "Tan", "Lim", "Al-Nahyan", "Al-Mansoori",
88
+ "Al-Falasi", "de Jong", "Jansen", "de Vries", "Andersson", "Johansson",
89
+ "Karlsson", "Hansen", "Johansen", "Olsen", "Nielsen", "Jensen", "Murphy",
90
+ "Kelly", "O'Brien", "Patel", "Das", "Chatterjee", "Banerjee", "Ghosh"
91
+ ]
92
+
93
+ # =============================================================================
94
+ # FINANCIAL - Major global banks and financial institutions
95
+ # =============================================================================
96
+
97
+ BANKS = [
98
+ # India
99
+ "State Bank of India (SBI)", "HDFC Bank", "ICICI Bank", "Axis Bank",
100
+ "Kotak Mahindra Bank", "Bank of Baroda", "Punjab National Bank",
101
+ "Canara Bank", "Union Bank of India", "IDFC First Bank",
102
+ # China
103
+ "Industrial and Commercial Bank of China", "China Construction Bank",
104
+ "Agricultural Bank of China", "Bank of China", "Bank of Communications",
105
+ "China Merchants Bank", "Postal Savings Bank of China", "Industrial Bank Co",
106
+ "Shanghai Pudong Development Bank",
107
+ # Japan
108
+ "Mitsubishi UFJ Financial Group", "Sumitomo Mitsui Financial Group",
109
+ "Mizuho Financial Group", "Resona Holdings", "Japan Post Bank",
110
+ # United States
111
+ "JPMorgan Chase", "Bank of America", "Citibank", "Wells Fargo",
112
+ "Goldman Sachs", "Morgan Stanley", "US Bank", "PNC Financial",
113
+ "Truist Financial", "Capital One",
114
+ # United Kingdom
115
+ "HSBC", "Barclays", "Lloyds Banking Group", "NatWest Group",
116
+ "Standard Chartered",
117
+ # Canada
118
+ "Royal Bank of Canada", "Toronto Dominion Bank", "Scotiabank",
119
+ "Bank of Montreal", "CIBC",
120
+ # France
121
+ "BNP Paribas", "Credit Agricole", "Societe Generale", "BPCE Group",
122
+ "La Banque Postale",
123
+ # Germany
124
+ "Deutsche Bank", "Commerzbank", "KfW Bankengruppe", "DZ Bank",
125
+ "Landesbank Baden Wuerttemberg",
126
+ # Switzerland
127
+ "UBS", "Julius Baer", "Raiffeisen Switzerland",
128
+ # Italy
129
+ "UniCredit", "Intesa Sanpaolo", "Banco BPM", "BPER Banca",
130
+ # Spain
131
+ "Santander", "BBVA", "CaixaBank", "Bankinter",
132
+ # Netherlands
133
+ "ING Group", "Rabobank", "ABN AMRO",
134
+ # Sweden
135
+ "Nordea", "SEB", "Swedbank", "Handelsbanken",
136
+ # Norway & Denmark
137
+ "DNB", "Danske Bank",
138
+ # Singapore
139
+ "DBS Bank", "OCBC Bank", "UOB",
140
+ # Malaysia
141
+ "Maybank", "CIMB Group", "RHB Bank",
142
+ # Indonesia
143
+ "Bank Mandiri", "Bank Rakyat Indonesia", "Bank Central Asia",
144
+ # South Korea
145
+ "KB Financial Group", "Shinhan Financial Group", "Hana Financial Group",
146
+ "Woori Bank",
147
+ # Australia
148
+ "Commonwealth Bank of Australia", "Westpac", "ANZ", "NAB",
149
+ # Brazil
150
+ "Itau Unibanco", "Banco Bradesco", "Banco do Brasil",
151
+ "Caixa Economica Federal",
152
+ # Mexico
153
+ "BBVA Mexico", "Banorte"
154
+ ]
155
+
156
+ CREDIT_CARD_NETWORKS = [
157
+ # Global majors
158
+ "Visa", "Mastercard", "American Express", "Discover",
159
+ "Diners Club International", "UnionPay",
160
+ # Japan
161
+ "JCB",
162
+ # India
163
+ "RuPay", "NCMC National Common Mobility Card",
164
+ # United States (additional networks)
165
+ "Pulse", "Star", "NYCE", "Accel", "Shazam", "Interlink", "Maestro",
166
+ "Cirrus", "Plus",
167
+ # Europe
168
+ "Girocard", "Cartes Bancaires", "Bancontact", "V Pay",
169
+ "EAPS European Alliance Payment Scheme", "Link UK ATM Network",
170
+ "PostePay Italy", "Multibanco Portugal",
171
+ # United Kingdom
172
+ "Switch", "Solo",
173
+ # Canada
174
+ "Interac", "Debit Mastercard Canada", "Visa Debit Canada",
175
+ # Latin America
176
+ "Elo Brazil", "Hipercard Brazil", "Cabal Argentina", "Naranja X Argentina",
177
+ "Red Link Argentina", "Banelco Argentina",
178
+ # Middle East
179
+ "Meeza Egypt", "Benefit Bahrain", "KNET Kuwait", "Mada Saudi Arabia",
180
+ "QatarPay", "OmanNet", "UAE Switch",
181
+ # Africa
182
+ "Verve Nigeria", "Interswitch", "GhLink Ghana", "Zimswitch Zimbabwe",
183
+ "KenSwitch Kenya", "Namclear Namibia",
184
+ # Southeast Asia
185
+ "GPN Indonesia", "PromptCard Thailand", "NETS Singapore",
186
+ "Touch n Go Malaysia", "MyDebit Malaysia", "BancNet Philippines",
187
+ "Vietcombank Card Vietnam",
188
+ # East Asia (non China/Japan)
189
+ "T Money Korea", "Cashbee Korea",
190
+ # China (additional)
191
+ "QuickPass", "China T Union Transit Card",
192
+ # Australia / New Zealand
193
+ "eftpos Australia", "BPAY", "Paymark New Zealand",
194
+ # Digital only / fintech card networks
195
+ "Revolut Card Network", "Nubank Card Network", "Monzo Card Network",
196
+ "Starling Card Network", "Chime Card Network", "Cash App Card Network",
197
+ # Private label / store card networks
198
+ "Target RedCard Network", "Walmart Card Network", "Costco Card Network",
199
+ "Amazon Store Card Network", "Best Buy Card Network"
200
+ ]
201
+
202
+ # =============================================================================
203
+ # RETAIL - Major global retailers and e-commerce platforms
204
+ # =============================================================================
205
+
206
+ RETAILERS = [
207
+ # India
208
+ "Reliance Retail", "DMart", "Tata Croma", "Big Bazaar", "Spencers Retail",
209
+ "V Mart", "More Retail", "Trent Westside", "Future Retail", "Shoppers Stop",
210
+ "Lifestyle India", "Pantaloons", "Fabindia", "Nykaa", "Myntra", "Flipkart",
211
+ "Tanishq", "Titan Company", "Apollo Pharmacy", "MedPlus",
212
+ # United States
213
+ "Walmart", "Amazon", "Costco", "Target", "Kroger", "Home Depot", "Lowes",
214
+ "Best Buy", "Walgreens", "CVS Pharmacy", "Macys", "Kohl's", "TJ Maxx",
215
+ "Dollar General", "Dollar Tree", "Nordstrom", "Sears", "Staples",
216
+ "Office Depot", "Whole Foods Market",
217
+ # United Kingdom
218
+ "Tesco", "Sainsbury's", "Asda", "Marks and Spencer", "John Lewis", "Argos",
219
+ "Boots", "Morrisons", "Next", "Primark",
220
+ # Europe (France, Germany, Spain, etc.)
221
+ "Carrefour", "Auchan", "Aldi", "Lidl", "Metro AG", "Edeka", "Rewe",
222
+ "El Corte Ingles", "MediaMarkt", "Decathlon",
223
+ # Japan
224
+ "Aeon", "Seven and I Holdings", "FamilyMart", "Lawson", "Don Quijote",
225
+ # China
226
+ "JD Retail", "Alibaba Tmall", "Suning", "Gome Retail", "Yonghui Superstores",
227
+ # South Korea
228
+ "Lotte Mart", "Shinsegae", "E Mart", "Homeplus",
229
+ # Southeast Asia
230
+ "Robinsons Philippines", "SM Retail", "Central Group Thailand",
231
+ "Big C Thailand", "VinMart Vietnam",
232
+ # Middle East
233
+ "Lulu Hypermarket", "Carrefour UAE", "Danube Saudi Arabia",
234
+ "Panda Retail Saudi Arabia", "Choithrams",
235
+ # Australia
236
+ "Woolworths Australia", "Coles", "JB Hi Fi", "Harvey Norman", "Myer",
237
+ # Africa
238
+ "Shoprite", "Pick n Pay", "Game Stores", "Massmart", "Nakumatt",
239
+ # Latin America
240
+ "Mercado Libre", "Falabella", "Cencosud", "Grupo Pao de Acucar",
241
+ "Liverpool Mexico"
242
+ ]
243
+
244
+ # =============================================================================
245
+ # TECHNOLOGY - Major global technology companies
246
+ # =============================================================================
247
+
248
+ TECH_COMPANIES = [
249
+ # India
250
+ "Tata Consultancy Services", "Infosys", "Wipro", "HCL Technologies",
251
+ "Tech Mahindra", "Larsen and Toubro Infotech", "Mindtree",
252
+ "Persistent Systems", "Mphasis", "Zensar Technologies", "Birlasoft",
253
+ "Hexaware Technologies", "NIIT Technologies", "Coforge",
254
+ "Reliance Jio Platforms", "Bharti Airtel Digital", "Zoho", "Freshworks",
255
+ "InMobi", "Quick Heal",
256
+ # Taiwan
257
+ "TSMC", "MediaTek", "Foxconn", "UMC", "ASE Technology",
258
+ "Realtek Semiconductor", "Novatek Microelectronics", "AU Optronics",
259
+ "Delta Electronics", "Pegatron", "Quanta Computer", "Compal Electronics",
260
+ "Wistron", "Macronix", "Winbond Electronics",
261
+ # United States
262
+ "Apple", "Microsoft", "Google", "Amazon Web Services", "Meta Platforms",
263
+ "IBM", "Intel", "Nvidia", "AMD", "Oracle", "Salesforce", "Adobe", "Cisco",
264
+ "Qualcomm", "HP", "Dell Technologies", "Uber", "Airbnb", "Palantir",
265
+ "Snowflake",
266
+ # United Kingdom
267
+ "ARM", "Sage Group", "Micro Focus", "BT Group", "Vodafone",
268
+ # Europe
269
+ "SAP", "Siemens", "Bosch", "Capgemini", "Atos", "Nokia", "Ericsson",
270
+ "Dassault Systemes", "Infineon Technologies", "STMicroelectronics",
271
+ # Japan
272
+ "Sony", "Panasonic", "Toshiba", "Fujitsu", "NEC", "Hitachi", "SoftBank",
273
+ "Rakuten", "Nintendo", "Canon",
274
+ # China
275
+ "Huawei", "Tencent", "Alibaba", "Baidu", "Xiaomi", "Lenovo", "ZTE",
276
+ "ByteDance", "JD Technology", "Hikvision",
277
+ # South Korea
278
+ "Samsung Electronics", "LG Electronics", "SK Hynix", "Naver", "Kakao",
279
+ # Southeast Asia
280
+ "Grab", "Sea Group", "GoTo Group", "FPT Software", "VNG Corporation",
281
+ # Middle East
282
+ "STC Solutions", "eFinance Egypt", "Etisalat Digital", "Aramco Digital",
283
+ "Beeah Digital",
284
+ # Australia
285
+ "Atlassian", "Telstra", "WiseTech Global", "Afterpay", "Canva",
286
+ # Africa
287
+ "MTN Group", "Safaricom", "Liquid Intelligent Technologies", "Naspers",
288
+ "Cell C",
289
+ # Latin America
290
+ "Mercado Libre", "Nubank", "TOTVS", "PagSeguro", "Globant"
291
+ ]
292
+
293
+ EMAIL_PROVIDERS = [
294
+ # Global giants
295
+ "gmail.com", "yahoo.com", "outlook.com", "hotmail.com", "live.com",
296
+ "icloud.com", "aol.com", "protonmail.com", "zoho.com", "mail.com",
297
+ # India
298
+ "rediffmail.com", "in.com", "sify.com", "airtelmail.in", "bsnl.in",
299
+ # USA
300
+ "msn.com", "comcast.net", "verizon.net", "att.net", "me.com", "mac.com",
301
+ # Europe
302
+ "gmx.com", "gmx.de", "web.de", "orange.fr", "free.fr", "laposte.net",
303
+ "btinternet.com", "virginmedia.com", "sky.com",
304
+ # UK
305
+ "hotmail.co.uk", "yahoo.co.uk", "live.co.uk",
306
+ # Germany
307
+ "t-online.de", "posteo.de", "mailbox.org",
308
+ # France
309
+ "sfr.fr", "wanadoo.fr",
310
+ # Russia
311
+ "mail.ru", "yandex.com", "yandex.ru", "rambler.ru",
312
+ # China
313
+ "qq.com", "163.com", "126.com", "sina.com", "sohu.com",
314
+ # Japan
315
+ "yahoo.co.jp", "docomo.ne.jp", "ezweb.ne.jp", "softbank.ne.jp",
316
+ # Korea
317
+ "naver.com", "daum.net", "hanmail.net",
318
+ # Middle East
319
+ "emirates.net.ae", "etisalat.ae", "saudi.net.sa",
320
+ # Africa
321
+ "webmail.co.za", "mtn.co.za",
322
+ # Latin America
323
+ "uol.com.br", "bol.com.br", "terra.com.br", "hotmail.com.mx", "live.com.mx",
324
+ # Southeast Asia
325
+ "singnet.com.sg", "starhub.net.sg", "tm.net.my", "pldt.com.ph",
326
+ "yahoo.com.ph",
327
+ # Australia / NZ
328
+ "bigpond.com", "optusnet.com.au", "xtra.co.nz",
329
+ # Privacy-focused / SaaS
330
+ "fastmail.com", "hey.com",
331
+ # Generic / testing domains (NOTE: only example.com is reserved by RFC 2606; the others are real, registrable domains)
332
+ "example.com", "test.com", "demo.com", "sample.com", "mailtest.com",
333
+ "placeholder.com", "domain.com"
334
+ ]
335
+
336
+ # =============================================================================
337
+ # BUSINESS - Common business categories and classifications
338
+ # =============================================================================
339
+
340
+ DEPARTMENTS = [
341
+ # Core Business Functions
342
+ "Human Resources", "Finance", "Accounting", "Sales", "Marketing",
343
+ "Operations", "Customer Service", "Customer Support",
344
+ # Technology & Engineering
345
+ "Information Technology", "Engineering", "Research and Development",
346
+ "Product Development", "Data Science", "Quality Assurance",
347
+ # Supply Chain & Logistics
348
+ "Supply Chain", "Procurement", "Logistics", "Warehouse",
349
+ # Legal & Compliance
350
+ "Legal", "Compliance", "Risk Management", "Internal Audit",
351
+ # Strategic & Executive
352
+ "Strategy", "Business Development", "Corporate Development", "Executive",
353
+ # Specialized
354
+ "Manufacturing", "Production", "Facilities", "Security", "Administration",
355
+ "Training", "Communications", "Public Relations"
356
+ ]
357
+
358
+ STATUSES = [
359
+ "Active", "Inactive", "Pending", "Completed", "Cancelled",
360
+ "In Progress", "On Hold", "Approved", "Rejected", "Draft"
361
+ ]
362
+
363
+ SEVERITIES = [
364
+ "Low", "Medium", "High", "Critical", "Urgent"
365
+ ]
366
+
367
+ PRIORITIES = [
368
+ "Low", "Medium", "High", "Critical"
369
+ ]
370
+
371
+ # =============================================================================
372
+ # MEDICAL - Common medical and healthcare terms
373
+ # =============================================================================
374
+
375
+ ADVERSE_EVENTS = [
376
+ "Headache", "Nausea", "Vomiting", "Dizziness", "Fatigue",
377
+ "Fever", "Chills", "Rash", "Itching", "Swelling",
378
+ "Pain", "Muscle Ache", "Joint Pain", "Weakness", "Insomnia",
379
+ "Anxiety", "Depression", "Confusion", "Tremor", "Seizure",
380
+ "Shortness of Breath", "Cough", "Chest Pain", "Palpitations",
381
+ "Edema", "Hypertension", "Hypotension", "Tachycardia"
382
+ ]
383
+
384
+ # =============================================================================
385
+ # MASTER REGISTRY - Maps list names to actual lists
386
+ # =============================================================================
387
+
388
+ BUILTIN_LISTS = {
389
+ # Names
390
+ "first_names": FIRST_NAMES,
391
+ "last_names": LAST_NAMES,
392
+ # Financial
393
+ "banks": BANKS,
394
+ "credit_card_networks": CREDIT_CARD_NETWORKS,
395
+ # Retail
396
+ "retailers": RETAILERS,
397
+ # Technology
398
+ "tech_companies": TECH_COMPANIES,
399
+ "email_providers": EMAIL_PROVIDERS,
400
+ # Business
401
+ "departments": DEPARTMENTS,
402
+ "statuses": STATUSES,
403
+ "severities": SEVERITIES,
404
+ "priorities": PRIORITIES,
405
+ # Medical
406
+ "adverse_events": ADVERSE_EVENTS,
407
+ }
408
+
409
+
410
def get_builtin_list(name: str):
    """
    Look up one of the built-in lists by its registry key.

    Args:
        name: Registry key of the list (e.g., "first_names", "banks")

    Returns:
        The list object stored in BUILTIN_LISTS under ``name`` (the
        registered object itself, not a copy), or None when no built-in
        list is registered under that key
    """
    if name in BUILTIN_LISTS:
        return BUILTIN_LISTS[name]
    return None
421
+
422
+
423
def list_builtin_names():
    """
    Enumerate the keys of the built-in list registry.

    Returns:
        A new list holding every name registered in BUILTIN_LISTS
    """
    return list(BUILTIN_LISTS)
@@ -0,0 +1,22 @@
1
+ """
2
+ Distribution Strategies for Data Augmentation
3
+
4
+ DEPRECATED: This module has been moved to additory.common.distributions
5
+ Please update your imports to use additory.common.distributions instead.
6
+
7
+ This file is kept for backward compatibility and will be removed in a future version.
8
+ """
9
+
10
import warnings

# Emit the deprecation notice as soon as this module is imported.
# stacklevel=2 reports the warning one frame above this module, which is
# intended to point at the code performing the import.
warnings.warn(
    message=(
        "additory.augment.distributions is deprecated. "
        "Please use additory.common.distributions instead. "
        "This module will be removed in a future version."
    ),
    category=DeprecationWarning,
    stacklevel=2,
)

# Re-export the public names of the new module so existing
# `from additory.augment.distributions import ...` statements keep working.
from additory.common.distributions import *  # noqa: F401, F403