@civiq/entity-resolution 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (81) hide show
  1. package/LICENSE +21 -0
  2. package/README.md +135 -0
  3. package/data/bioguide-fec-mapping.json +4186 -0
  4. package/data/sec-sic-data.json +10427 -0
  5. package/dist/__tests__/company-entity-resolver.test.d.ts +6 -0
  6. package/dist/__tests__/company-entity-resolver.test.d.ts.map +1 -0
  7. package/dist/__tests__/company-entity-resolver.test.js +267 -0
  8. package/dist/__tests__/company-entity-resolver.test.js.map +1 -0
  9. package/dist/__tests__/entity-resolution.test.d.ts +2 -0
  10. package/dist/__tests__/entity-resolution.test.d.ts.map +1 -0
  11. package/dist/__tests__/entity-resolution.test.js +296 -0
  12. package/dist/__tests__/entity-resolution.test.js.map +1 -0
  13. package/dist/__tests__/fec-entity-resolution.test.d.ts +2 -0
  14. package/dist/__tests__/fec-entity-resolution.test.d.ts.map +1 -0
  15. package/dist/__tests__/fec-entity-resolution.test.js +49 -0
  16. package/dist/__tests__/fec-entity-resolution.test.js.map +1 -0
  17. package/dist/bioguide-fec-mapping.d.ts +27 -0
  18. package/dist/bioguide-fec-mapping.d.ts.map +1 -0
  19. package/dist/bioguide-fec-mapping.js +57 -0
  20. package/dist/bioguide-fec-mapping.js.map +1 -0
  21. package/dist/cache.d.ts +18 -0
  22. package/dist/cache.d.ts.map +1 -0
  23. package/dist/cache.js +18 -0
  24. package/dist/cache.js.map +1 -0
  25. package/dist/committee-agency-map.d.ts +58 -0
  26. package/dist/committee-agency-map.d.ts.map +1 -0
  27. package/dist/committee-agency-map.js +658 -0
  28. package/dist/committee-agency-map.js.map +1 -0
  29. package/dist/committee-alias-table.d.ts +11 -0
  30. package/dist/committee-alias-table.d.ts.map +1 -0
  31. package/dist/committee-alias-table.js +191 -0
  32. package/dist/committee-alias-table.js.map +1 -0
  33. package/dist/company-alias-table.d.ts +36 -0
  34. package/dist/company-alias-table.d.ts.map +1 -0
  35. package/dist/company-alias-table.js +1307 -0
  36. package/dist/company-alias-table.js.map +1 -0
  37. package/dist/company-entity-resolver.d.ts +94 -0
  38. package/dist/company-entity-resolver.d.ts.map +1 -0
  39. package/dist/company-entity-resolver.js +282 -0
  40. package/dist/company-entity-resolver.js.map +1 -0
  41. package/dist/configure.d.ts +15 -0
  42. package/dist/configure.d.ts.map +1 -0
  43. package/dist/configure.js +19 -0
  44. package/dist/configure.js.map +1 -0
  45. package/dist/fec-entity-resolution.d.ts +88 -0
  46. package/dist/fec-entity-resolution.d.ts.map +1 -0
  47. package/dist/fec-entity-resolution.js +407 -0
  48. package/dist/fec-entity-resolution.js.map +1 -0
  49. package/dist/index.d.ts +30 -0
  50. package/dist/index.d.ts.map +1 -0
  51. package/dist/index.js +33 -0
  52. package/dist/index.js.map +1 -0
  53. package/dist/industry-taxonomy.d.ts +90 -0
  54. package/dist/industry-taxonomy.d.ts.map +1 -0
  55. package/dist/industry-taxonomy.js +1026 -0
  56. package/dist/industry-taxonomy.js.map +1 -0
  57. package/dist/lda-issue-policy-map.d.ts +13 -0
  58. package/dist/lda-issue-policy-map.d.ts.map +1 -0
  59. package/dist/lda-issue-policy-map.js +193 -0
  60. package/dist/lda-issue-policy-map.js.map +1 -0
  61. package/dist/lobbying-committee-resolver.d.ts +23 -0
  62. package/dist/lobbying-committee-resolver.d.ts.map +1 -0
  63. package/dist/lobbying-committee-resolver.js +158 -0
  64. package/dist/lobbying-committee-resolver.js.map +1 -0
  65. package/dist/logger.d.ts +20 -0
  66. package/dist/logger.d.ts.map +1 -0
  67. package/dist/logger.js +20 -0
  68. package/dist/logger.js.map +1 -0
  69. package/dist/sic-sector-map.d.ts +32 -0
  70. package/dist/sic-sector-map.d.ts.map +1 -0
  71. package/dist/sic-sector-map.js +109 -0
  72. package/dist/sic-sector-map.js.map +1 -0
  73. package/dist/ticker-industry-resolver.d.ts +22 -0
  74. package/dist/ticker-industry-resolver.d.ts.map +1 -0
  75. package/dist/ticker-industry-resolver.js +254 -0
  76. package/dist/ticker-industry-resolver.js.map +1 -0
  77. package/dist/types.d.ts +30 -0
  78. package/dist/types.d.ts.map +1 -0
  79. package/dist/types.js +6 -0
  80. package/dist/types.js.map +1 -0
  81. package/package.json +51 -0
@@ -0,0 +1,1307 @@
1
+ /**
2
+ * Copyright (c) 2019-2025 Mark Sandford
3
+ * Licensed under the MIT License. See LICENSE and NOTICE files.
4
+ */
5
+ /**
6
+ * Company Alias Table
7
+ *
8
+ * Static mapping of top companies by lobbying spend with known name
9
+ * variants across federal APIs: EPA, OSHA, CFPB, SEC, FEC, and LDA
10
+ * (Senate Lobbying Disclosure Act filings).
11
+ *
12
+ * Each entry has a canonical name, known aliases, SIC and NAICS codes,
13
+ * sector, and SEC CIK (null where unavailable). The alias lookup is
14
+ * case-insensitive and strips corporate suffixes before matching.
15
+ */
16
+ import { IndustrySector } from './industry-taxonomy';
17
+ /**
18
+ * Top companies by lobbying spend with cross-API name variants.
19
+ * Entries are grouped under sector headings; ordering by total lobbying expenditure (descending) is only approximate.
20
+ */
21
+ export const COMPANY_ALIAS_TABLE = [
22
+ // ── Pharmaceuticals & Health ────────────────────────────────────────
23
+ {
24
+ canonicalName: 'PFIZER',
25
+ aliases: ['PFIZER INC', 'PFIZER INC.', 'PFIZER PHARMACEUTICALS', 'PFE'],
26
+ sicCodes: ['2834'],
27
+ naicsCodes: ['325412'],
28
+ sector: IndustrySector.HEALTH,
29
+ cik: '78003',
30
+ },
31
+ {
32
+ canonicalName: 'JOHNSON AND JOHNSON',
33
+ aliases: [
34
+ 'JOHNSON & JOHNSON',
35
+ 'J&J',
36
+ 'JNJ',
37
+ 'JOHNSON AND JOHNSON INC',
38
+ 'JOHNSON & JOHNSON INC.',
39
+ 'JANSSEN PHARMACEUTICALS',
40
+ 'JANSSEN BIOTECH',
41
+ ],
42
+ sicCodes: ['2834', '3841'],
43
+ naicsCodes: ['325412', '339112'],
44
+ sector: IndustrySector.HEALTH,
45
+ cik: '200406',
46
+ },
47
+ {
48
+ canonicalName: 'MERCK',
49
+ aliases: [
50
+ 'MERCK & CO',
51
+ 'MERCK AND CO',
52
+ 'MERCK & CO INC',
53
+ 'MERCK & CO., INC.',
54
+ 'MERCK SHARP & DOHME',
55
+ 'MSD',
56
+ 'MRK',
57
+ ],
58
+ sicCodes: ['2834'],
59
+ naicsCodes: ['325412'],
60
+ sector: IndustrySector.HEALTH,
61
+ cik: '310158',
62
+ },
63
+ {
64
+ canonicalName: 'ABBVIE',
65
+ aliases: ['ABBVIE INC', 'ABBVIE INC.', 'ABBV'],
66
+ sicCodes: ['2834'],
67
+ naicsCodes: ['325412'],
68
+ sector: IndustrySector.HEALTH,
69
+ cik: '1551152',
70
+ },
71
+ {
72
+ canonicalName: 'ELI LILLY',
73
+ aliases: ['ELI LILLY AND COMPANY', 'ELI LILLY & CO', 'LILLY', 'LLY', 'ELI LILLY AND CO'],
74
+ sicCodes: ['2834'],
75
+ naicsCodes: ['325412'],
76
+ sector: IndustrySector.HEALTH,
77
+ cik: '59478',
78
+ },
79
+ {
80
+ canonicalName: 'AMGEN',
81
+ aliases: ['AMGEN INC', 'AMGEN INC.', 'AMGN'],
82
+ sicCodes: ['2836'],
83
+ naicsCodes: ['325414'],
84
+ sector: IndustrySector.HEALTH,
85
+ cik: '318154',
86
+ },
87
+ {
88
+ canonicalName: 'BRISTOL MYERS SQUIBB',
89
+ aliases: [
90
+ 'BRISTOL-MYERS SQUIBB',
91
+ 'BRISTOL-MYERS SQUIBB CO',
92
+ 'BRISTOL MYERS SQUIBB CO',
93
+ 'BMS',
94
+ 'BMY',
95
+ ],
96
+ sicCodes: ['2834'],
97
+ naicsCodes: ['325412'],
98
+ sector: IndustrySector.HEALTH,
99
+ cik: '14272',
100
+ },
101
+ {
102
+ canonicalName: 'UNITEDHEALTH GROUP',
103
+ aliases: [
104
+ 'UNITEDHEALTH GROUP INC',
105
+ 'UNITEDHEALTH GROUP INCORPORATED',
106
+ 'UNITED HEALTH GROUP',
107
+ 'UNH',
108
+ 'UNITEDHEALTHCARE',
109
+ ],
110
+ sicCodes: ['6324'],
111
+ naicsCodes: ['524114'],
112
+ sector: IndustrySector.HEALTH,
113
+ cik: '731766',
114
+ },
115
+ {
116
+ canonicalName: 'CVS HEALTH',
117
+ aliases: ['CVS HEALTH CORP', 'CVS HEALTH CORPORATION', 'CVS CAREMARK', 'CVS PHARMACY', 'CVS'],
118
+ sicCodes: ['5912'],
119
+ naicsCodes: ['446110'],
120
+ sector: IndustrySector.HEALTH,
121
+ cik: '64803',
122
+ },
123
+ {
124
+ canonicalName: 'CIGNA',
125
+ aliases: ['CIGNA CORP', 'CIGNA CORPORATION', 'THE CIGNA GROUP', 'CI'],
126
+ sicCodes: ['6321'],
127
+ naicsCodes: ['524114'],
128
+ sector: IndustrySector.HEALTH,
129
+ cik: '1739940',
130
+ },
131
+ {
132
+ canonicalName: 'ANTHEM',
133
+ aliases: [
134
+ 'ANTHEM INC',
135
+ 'ELEVANCE HEALTH',
136
+ 'ELEVANCE HEALTH INC',
137
+ 'WELLPOINT',
138
+ 'WELLPOINT INC',
139
+ 'ELV',
140
+ ],
141
+ sicCodes: ['6324'],
142
+ naicsCodes: ['524114'],
143
+ sector: IndustrySector.HEALTH,
144
+ cik: '1156039',
145
+ },
146
+ {
147
+ canonicalName: 'HUMANA',
148
+ aliases: ['HUMANA INC', 'HUMANA INC.', 'HUM'],
149
+ sicCodes: ['6324'],
150
+ naicsCodes: ['524114'],
151
+ sector: IndustrySector.HEALTH,
152
+ cik: '49071',
153
+ },
154
+ {
155
+ canonicalName: 'MEDTRONIC',
156
+ aliases: ['MEDTRONIC PLC', 'MEDTRONIC INC', 'MDT'],
157
+ sicCodes: ['3841'],
158
+ naicsCodes: ['339112'],
159
+ sector: IndustrySector.HEALTH,
160
+ cik: '1613103',
161
+ },
162
+ {
163
+ canonicalName: 'ABBOTT LABORATORIES',
164
+ aliases: ['ABBOTT LABS', 'ABBOTT', 'ABT'],
165
+ sicCodes: ['3841'],
166
+ naicsCodes: ['339112'],
167
+ sector: IndustrySector.HEALTH,
168
+ cik: '1800',
169
+ },
170
+ // ── Technology & Communications ─────────────────────────────────────
171
+ {
172
+ canonicalName: 'ALPHABET',
173
+ aliases: ['ALPHABET INC', 'GOOGLE', 'GOOGLE INC', 'GOOGLE LLC', 'GOOG', 'GOOGL'],
174
+ sicCodes: ['7372'],
175
+ naicsCodes: ['519130'],
176
+ sector: IndustrySector.COMMUNICATIONS_ELECTRONICS,
177
+ cik: '1652044',
178
+ },
179
+ {
180
+ canonicalName: 'META PLATFORMS',
181
+ aliases: [
182
+ 'META PLATFORMS INC',
183
+ 'META',
184
+ 'FACEBOOK',
185
+ 'FACEBOOK INC',
186
+ 'FB',
187
+ 'META PLATFORMS INC.',
188
+ ],
189
+ sicCodes: ['7372'],
190
+ naicsCodes: ['519130'],
191
+ sector: IndustrySector.COMMUNICATIONS_ELECTRONICS,
192
+ cik: '1326801',
193
+ },
194
+ {
195
+ canonicalName: 'AMAZON',
196
+ aliases: [
197
+ 'AMAZON.COM',
198
+ 'AMAZON.COM INC',
199
+ 'AMAZON COM INC',
200
+ 'AMAZON INC',
201
+ 'AMZN',
202
+ 'AMAZON WEB SERVICES',
203
+ 'AWS',
204
+ ],
205
+ sicCodes: ['5961'],
206
+ naicsCodes: ['454110'],
207
+ sector: IndustrySector.COMMUNICATIONS_ELECTRONICS,
208
+ cik: '1018724',
209
+ },
210
+ {
211
+ canonicalName: 'APPLE',
212
+ aliases: ['APPLE INC', 'APPLE INC.', 'AAPL', 'APPLE COMPUTER'],
213
+ sicCodes: ['3571'],
214
+ naicsCodes: ['334111'],
215
+ sector: IndustrySector.COMMUNICATIONS_ELECTRONICS,
216
+ cik: '320193',
217
+ },
218
+ {
219
+ canonicalName: 'MICROSOFT',
220
+ aliases: ['MICROSOFT CORP', 'MICROSOFT CORPORATION', 'MSFT'],
221
+ sicCodes: ['7372'],
222
+ naicsCodes: ['511210'],
223
+ sector: IndustrySector.COMMUNICATIONS_ELECTRONICS,
224
+ cik: '789019',
225
+ },
226
+ {
227
+ canonicalName: 'AT AND T',
228
+ aliases: [
229
+ 'AT&T',
230
+ 'AT&T INC',
231
+ 'AT&T INC.',
232
+ 'ATT',
233
+ 'AT AND T INC',
234
+ 'AMERICAN TELEPHONE AND TELEGRAPH',
235
+ 'SOUTHWESTERN BELL',
236
+ 'T',
237
+ ],
238
+ sicCodes: ['4813'],
239
+ naicsCodes: ['517110'],
240
+ sector: IndustrySector.COMMUNICATIONS_ELECTRONICS,
241
+ cik: '732717',
242
+ },
243
+ {
244
+ canonicalName: 'COMCAST',
245
+ aliases: [
246
+ 'COMCAST CORP',
247
+ 'COMCAST CORPORATION',
248
+ 'COMCAST NBCUNIVERSAL',
249
+ 'NBCUNIVERSAL',
250
+ 'CMCSA',
251
+ ],
252
+ sicCodes: ['4841'],
253
+ naicsCodes: ['517110'],
254
+ sector: IndustrySector.COMMUNICATIONS_ELECTRONICS,
255
+ cik: '902739',
256
+ },
257
+ {
258
+ canonicalName: 'VERIZON',
259
+ aliases: ['VERIZON COMMUNICATIONS', 'VERIZON COMMUNICATIONS INC', 'VZ', 'VERIZON WIRELESS'],
260
+ sicCodes: ['4813'],
261
+ naicsCodes: ['517110'],
262
+ sector: IndustrySector.COMMUNICATIONS_ELECTRONICS,
263
+ cik: '732712',
264
+ },
265
+ {
266
+ canonicalName: 'INTEL',
267
+ aliases: ['INTEL CORP', 'INTEL CORPORATION', 'INTC'],
268
+ sicCodes: ['3674'],
269
+ naicsCodes: ['334413'],
270
+ sector: IndustrySector.COMMUNICATIONS_ELECTRONICS,
271
+ cik: '50863',
272
+ },
273
+ {
274
+ canonicalName: 'QUALCOMM',
275
+ aliases: ['QUALCOMM INC', 'QUALCOMM INCORPORATED', 'QCOM'],
276
+ sicCodes: ['3674'],
277
+ naicsCodes: ['334413'],
278
+ sector: IndustrySector.COMMUNICATIONS_ELECTRONICS,
279
+ cik: '804328',
280
+ },
281
+ {
282
+ canonicalName: 'ORACLE',
283
+ aliases: ['ORACLE CORP', 'ORACLE CORPORATION', 'ORCL'],
284
+ sicCodes: ['7372'],
285
+ naicsCodes: ['511210'],
286
+ sector: IndustrySector.COMMUNICATIONS_ELECTRONICS,
287
+ cik: '1341439',
288
+ },
289
+ {
290
+ canonicalName: 'IBM',
291
+ aliases: [
292
+ 'INTERNATIONAL BUSINESS MACHINES',
293
+ 'INTERNATIONAL BUSINESS MACHINES CORP',
294
+ 'IBM CORP',
295
+ ],
296
+ sicCodes: ['7372'],
297
+ naicsCodes: ['511210'],
298
+ sector: IndustrySector.COMMUNICATIONS_ELECTRONICS,
299
+ cik: '51143',
300
+ },
301
+ {
302
+ canonicalName: 'CISCO',
303
+ aliases: ['CISCO SYSTEMS', 'CISCO SYSTEMS INC', 'CSCO'],
304
+ sicCodes: ['3577'],
305
+ naicsCodes: ['334290'],
306
+ sector: IndustrySector.COMMUNICATIONS_ELECTRONICS,
307
+ cik: '858877',
308
+ },
309
+ {
310
+ canonicalName: 'SALESFORCE',
311
+ aliases: ['SALESFORCE INC', 'SALESFORCE.COM', 'CRM'],
312
+ sicCodes: ['7372'],
313
+ naicsCodes: ['511210'],
314
+ sector: IndustrySector.COMMUNICATIONS_ELECTRONICS,
315
+ cik: '1108524',
316
+ },
317
+ {
318
+ canonicalName: 'NVIDIA',
319
+ aliases: ['NVIDIA CORP', 'NVIDIA CORPORATION', 'NVDA'],
320
+ sicCodes: ['3674'],
321
+ naicsCodes: ['334413'],
322
+ sector: IndustrySector.COMMUNICATIONS_ELECTRONICS,
323
+ cik: '1045810',
324
+ },
325
+ {
326
+ canonicalName: 'BROADCOM',
327
+ aliases: ['BROADCOM INC', 'AVAGO TECHNOLOGIES', 'AVGO'],
328
+ sicCodes: ['3674'],
329
+ naicsCodes: ['334413'],
330
+ sector: IndustrySector.COMMUNICATIONS_ELECTRONICS,
331
+ cik: '1649338',
332
+ },
333
+ {
334
+ canonicalName: 'T-MOBILE',
335
+ aliases: ['T-MOBILE US', 'T-MOBILE US INC', 'TMUS', 'SPRINT', 'SPRINT CORP'],
336
+ sicCodes: ['4812'],
337
+ naicsCodes: ['517210'],
338
+ sector: IndustrySector.COMMUNICATIONS_ELECTRONICS,
339
+ cik: '1283699',
340
+ },
341
+ // ── Defense & Aerospace ─────────────────────────────────────────────
342
+ {
343
+ canonicalName: 'LOCKHEED MARTIN',
344
+ aliases: ['LOCKHEED MARTIN CORP', 'LOCKHEED MARTIN CORPORATION', 'LOCKMART', 'LMT', 'LOCKHEED'],
345
+ sicCodes: ['3761'],
346
+ naicsCodes: ['336411'],
347
+ sector: IndustrySector.DEFENSE,
348
+ cik: '936468',
349
+ },
350
+ {
351
+ canonicalName: 'RAYTHEON TECHNOLOGIES',
352
+ aliases: [
353
+ 'RAYTHEON',
354
+ 'RTX',
355
+ 'RTX CORP',
356
+ 'RAYTHEON CO',
357
+ 'RAYTHEON COMPANY',
358
+ 'UNITED TECHNOLOGIES',
359
+ 'UNITED TECHNOLOGIES CORP',
360
+ ],
361
+ sicCodes: ['3724'],
362
+ naicsCodes: ['336411'],
363
+ sector: IndustrySector.DEFENSE,
364
+ cik: '101829',
365
+ },
366
+ {
367
+ canonicalName: 'BOEING',
368
+ aliases: ['THE BOEING COMPANY', 'BOEING CO', 'BOEING COMPANY', 'BA'],
369
+ sicCodes: ['3721'],
370
+ naicsCodes: ['336411'],
371
+ sector: IndustrySector.DEFENSE,
372
+ cik: '12927',
373
+ },
374
+ {
375
+ canonicalName: 'NORTHROP GRUMMAN',
376
+ aliases: ['NORTHROP GRUMMAN CORP', 'NORTHROP GRUMMAN CORPORATION', 'NOC', 'NORTHRUP GRUMMAN'],
377
+ sicCodes: ['3761'],
378
+ naicsCodes: ['336411'],
379
+ sector: IndustrySector.DEFENSE,
380
+ cik: '1133421',
381
+ },
382
+ {
383
+ canonicalName: 'GENERAL DYNAMICS',
384
+ aliases: ['GENERAL DYNAMICS CORP', 'GENERAL DYNAMICS CORPORATION', 'GD'],
385
+ sicCodes: ['3731'],
386
+ naicsCodes: ['336611'],
387
+ sector: IndustrySector.DEFENSE,
388
+ cik: '40533',
389
+ },
390
+ {
391
+ canonicalName: 'L3HARRIS TECHNOLOGIES',
392
+ aliases: [
393
+ 'L3HARRIS',
394
+ 'L3 HARRIS',
395
+ 'L3 TECHNOLOGIES',
396
+ 'HARRIS CORP',
397
+ 'HARRIS CORPORATION',
398
+ 'LHX',
399
+ ],
400
+ sicCodes: ['3812'],
401
+ naicsCodes: ['334511'],
402
+ sector: IndustrySector.DEFENSE,
403
+ cik: '202058',
404
+ },
405
+ {
406
+ canonicalName: 'BAE SYSTEMS',
407
+ aliases: ['BAE SYSTEMS INC', 'BAE SYSTEMS PLC', 'BAE'],
408
+ sicCodes: ['3812'],
409
+ naicsCodes: ['334511'],
410
+ sector: IndustrySector.DEFENSE,
411
+ cik: null,
412
+ },
413
+ {
414
+ canonicalName: 'LEIDOS',
415
+ aliases: ['LEIDOS HOLDINGS', 'LEIDOS INC', 'LDOS', 'SAIC'],
416
+ sicCodes: ['7371'],
417
+ naicsCodes: ['541512'],
418
+ sector: IndustrySector.DEFENSE,
419
+ cik: '1336920',
420
+ },
421
+ {
422
+ canonicalName: 'HUNTINGTON INGALLS',
423
+ aliases: ['HUNTINGTON INGALLS INDUSTRIES', 'HII', 'NEWPORT NEWS SHIPBUILDING'],
424
+ sicCodes: ['3731'],
425
+ naicsCodes: ['336611'],
426
+ sector: IndustrySector.DEFENSE,
427
+ cik: '1501585',
428
+ },
429
+ // ── Energy & Natural Resources ──────────────────────────────────────
430
+ {
431
+ canonicalName: 'EXXON MOBIL',
432
+ aliases: [
433
+ 'EXXONMOBIL',
434
+ 'EXXON MOBIL CORP',
435
+ 'EXXON MOBIL CORPORATION',
436
+ 'XOM',
437
+ 'EXXON',
438
+ 'MOBIL',
439
+ 'EXXON CHEMICAL',
440
+ ],
441
+ sicCodes: ['2911'],
442
+ naicsCodes: ['324110'],
443
+ sector: IndustrySector.ENERGY_NATURAL_RESOURCES,
444
+ cik: '34088',
445
+ },
446
+ {
447
+ canonicalName: 'CHEVRON',
448
+ aliases: ['CHEVRON CORP', 'CHEVRON CORPORATION', 'CVX', 'CHEVRON USA', 'CHEVRON TEXACO'],
449
+ sicCodes: ['2911'],
450
+ naicsCodes: ['324110'],
451
+ sector: IndustrySector.ENERGY_NATURAL_RESOURCES,
452
+ cik: '93410',
453
+ },
454
+ {
455
+ canonicalName: 'CONOCOPHILLIPS',
456
+ aliases: ['CONOCO PHILLIPS', 'CONOCOPHILLIPS CO', 'COP', 'CONOCO'],
457
+ sicCodes: ['1311'],
458
+ naicsCodes: ['211120'],
459
+ sector: IndustrySector.ENERGY_NATURAL_RESOURCES,
460
+ cik: '1163165',
461
+ },
462
+ {
463
+ canonicalName: 'KOCH INDUSTRIES',
464
+ aliases: [
465
+ 'KOCH INDUSTRIES INC',
466
+ 'KOCH',
467
+ 'KOCH COMPANIES',
468
+ 'GEORGIA-PACIFIC',
469
+ 'GEORGIA PACIFIC',
470
+ 'FLINT HILLS RESOURCES',
471
+ 'INVISTA',
472
+ ],
473
+ sicCodes: ['2911'],
474
+ naicsCodes: ['324110'],
475
+ sector: IndustrySector.ENERGY_NATURAL_RESOURCES,
476
+ cik: null,
477
+ },
478
+ {
479
+ canonicalName: 'DUKE ENERGY',
480
+ aliases: ['DUKE ENERGY CORP', 'DUKE ENERGY CORPORATION', 'DUK'],
481
+ sicCodes: ['4911'],
482
+ naicsCodes: ['221112'],
483
+ sector: IndustrySector.ENERGY_NATURAL_RESOURCES,
484
+ cik: '1326160',
485
+ },
486
+ {
487
+ canonicalName: 'SOUTHERN COMPANY',
488
+ aliases: ['THE SOUTHERN COMPANY', 'SOUTHERN CO', 'SO', 'GEORGIA POWER', 'ALABAMA POWER'],
489
+ sicCodes: ['4911'],
490
+ naicsCodes: ['221112'],
491
+ sector: IndustrySector.ENERGY_NATURAL_RESOURCES,
492
+ cik: '92122',
493
+ },
494
+ {
495
+ canonicalName: 'NEXTERA ENERGY',
496
+ aliases: [
497
+ 'NEXTERA ENERGY INC',
498
+ 'NEE',
499
+ 'FPL GROUP',
500
+ 'FLORIDA POWER AND LIGHT',
501
+ 'FLORIDA POWER & LIGHT',
502
+ ],
503
+ sicCodes: ['4911'],
504
+ naicsCodes: ['221112'],
505
+ sector: IndustrySector.ENERGY_NATURAL_RESOURCES,
506
+ cik: '753308',
507
+ },
508
+ {
509
+ canonicalName: 'DOMINION ENERGY',
510
+ aliases: ['DOMINION ENERGY INC', 'DOMINION', 'D'],
511
+ sicCodes: ['4911'],
512
+ naicsCodes: ['221112'],
513
+ sector: IndustrySector.ENERGY_NATURAL_RESOURCES,
514
+ cik: '715957',
515
+ },
516
+ {
517
+ canonicalName: 'PHILLIPS 66',
518
+ aliases: ['PHILLIPS 66 CO', 'PSX'],
519
+ sicCodes: ['2911'],
520
+ naicsCodes: ['324110'],
521
+ sector: IndustrySector.ENERGY_NATURAL_RESOURCES,
522
+ cik: '1534701',
523
+ },
524
+ {
525
+ canonicalName: 'VALERO ENERGY',
526
+ aliases: ['VALERO ENERGY CORP', 'VALERO', 'VLO'],
527
+ sicCodes: ['2911'],
528
+ naicsCodes: ['324110'],
529
+ sector: IndustrySector.ENERGY_NATURAL_RESOURCES,
530
+ cik: '1035002',
531
+ },
532
+ {
533
+ canonicalName: 'DEVON ENERGY',
534
+ aliases: ['DEVON ENERGY CORP', 'DVN'],
535
+ sicCodes: ['1311'],
536
+ naicsCodes: ['211120'],
537
+ sector: IndustrySector.ENERGY_NATURAL_RESOURCES,
538
+ cik: '1090012',
539
+ },
540
+ {
541
+ canonicalName: 'HALLIBURTON',
542
+ aliases: ['HALLIBURTON CO', 'HALLIBURTON COMPANY', 'HAL'],
543
+ sicCodes: ['1381'],
544
+ naicsCodes: ['213111'],
545
+ sector: IndustrySector.ENERGY_NATURAL_RESOURCES,
546
+ cik: '45012',
547
+ },
548
+ // ── Finance / Insurance / Real Estate ───────────────────────────────
549
+ {
550
+ canonicalName: 'JPMORGAN CHASE',
551
+ aliases: [
552
+ 'JPMORGAN CHASE & CO',
553
+ 'JPMORGAN CHASE AND CO',
554
+ 'JP MORGAN CHASE',
555
+ 'JP MORGAN',
556
+ 'JPMORGAN',
557
+ 'JPM',
558
+ 'CHASE',
559
+ 'J.P. MORGAN',
560
+ ],
561
+ sicCodes: ['6020'],
562
+ naicsCodes: ['522110'],
563
+ sector: IndustrySector.FINANCE_INSURANCE_REAL_ESTATE,
564
+ cik: '19617',
565
+ },
566
+ {
567
+ canonicalName: 'BANK OF AMERICA',
568
+ aliases: [
569
+ 'BANK OF AMERICA CORP',
570
+ 'BANK OF AMERICA CORPORATION',
571
+ 'BOFA',
572
+ 'BAC',
573
+ 'MERRILL LYNCH',
574
+ 'BANK OF AMERICA NA',
575
+ ],
576
+ sicCodes: ['6020'],
577
+ naicsCodes: ['522110'],
578
+ sector: IndustrySector.FINANCE_INSURANCE_REAL_ESTATE,
579
+ cik: '70858',
580
+ },
581
+ {
582
+ canonicalName: 'GOLDMAN SACHS',
583
+ aliases: ['THE GOLDMAN SACHS GROUP', 'GOLDMAN SACHS GROUP', 'GOLDMAN SACHS & CO', 'GS'],
584
+ sicCodes: ['6211'],
585
+ naicsCodes: ['523110'],
586
+ sector: IndustrySector.FINANCE_INSURANCE_REAL_ESTATE,
587
+ cik: '886982',
588
+ },
589
+ {
590
+ canonicalName: 'CITIGROUP',
591
+ aliases: ['CITIGROUP INC', 'CITIBANK', 'CITI', 'C', 'CITICORP'],
592
+ sicCodes: ['6020'],
593
+ naicsCodes: ['522110'],
594
+ sector: IndustrySector.FINANCE_INSURANCE_REAL_ESTATE,
595
+ cik: '831001',
596
+ },
597
+ {
598
+ canonicalName: 'WELLS FARGO',
599
+ aliases: ['WELLS FARGO & CO', 'WELLS FARGO AND COMPANY', 'WELLS FARGO BANK', 'WFC'],
600
+ sicCodes: ['6020'],
601
+ naicsCodes: ['522110'],
602
+ sector: IndustrySector.FINANCE_INSURANCE_REAL_ESTATE,
603
+ cik: '72971',
604
+ },
605
+ {
606
+ canonicalName: 'MORGAN STANLEY',
607
+ aliases: ['MORGAN STANLEY & CO', 'MS'],
608
+ sicCodes: ['6211'],
609
+ naicsCodes: ['523110'],
610
+ sector: IndustrySector.FINANCE_INSURANCE_REAL_ESTATE,
611
+ cik: '895421',
612
+ },
613
+ {
614
+ canonicalName: 'BLACKROCK',
615
+ aliases: ['BLACKROCK INC', 'BLACKROCK FINANCIAL', 'BLK'],
616
+ sicCodes: ['6282'],
617
+ naicsCodes: ['523920'],
618
+ sector: IndustrySector.FINANCE_INSURANCE_REAL_ESTATE,
619
+ cik: '1364742',
620
+ },
621
+ {
622
+ canonicalName: 'CHARLES SCHWAB',
623
+ aliases: ['THE CHARLES SCHWAB CORPORATION', 'CHARLES SCHWAB CORP', 'SCHWAB', 'SCHW'],
624
+ sicCodes: ['6211'],
625
+ naicsCodes: ['523120'],
626
+ sector: IndustrySector.FINANCE_INSURANCE_REAL_ESTATE,
627
+ cik: '316709',
628
+ },
629
+ {
630
+ canonicalName: 'AMERICAN EXPRESS',
631
+ aliases: ['AMERICAN EXPRESS CO', 'AMEX', 'AXP'],
632
+ sicCodes: ['6153'],
633
+ naicsCodes: ['522210'],
634
+ sector: IndustrySector.FINANCE_INSURANCE_REAL_ESTATE,
635
+ cik: '4962',
636
+ },
637
+ {
638
+ canonicalName: 'CAPITAL ONE',
639
+ aliases: ['CAPITAL ONE FINANCIAL', 'CAPITAL ONE FINANCIAL CORP', 'COF'],
640
+ sicCodes: ['6020'],
641
+ naicsCodes: ['522110'],
642
+ sector: IndustrySector.FINANCE_INSURANCE_REAL_ESTATE,
643
+ cik: '927628',
644
+ },
645
+ {
646
+ canonicalName: 'US BANCORP',
647
+ aliases: ['U.S. BANCORP', 'US BANK', 'USB'],
648
+ sicCodes: ['6020'],
649
+ naicsCodes: ['522110'],
650
+ sector: IndustrySector.FINANCE_INSURANCE_REAL_ESTATE,
651
+ cik: '36104',
652
+ },
653
+ {
654
+ canonicalName: 'PNC FINANCIAL',
655
+ aliases: ['PNC FINANCIAL SERVICES', 'PNC FINANCIAL SERVICES GROUP', 'PNC BANK', 'PNC'],
656
+ sicCodes: ['6020'],
657
+ naicsCodes: ['522110'],
658
+ sector: IndustrySector.FINANCE_INSURANCE_REAL_ESTATE,
659
+ cik: '713676',
660
+ },
661
+ {
662
+ canonicalName: 'BERKSHIRE HATHAWAY',
663
+ aliases: ['BERKSHIRE HATHAWAY INC', 'BRK', 'BRKB'],
664
+ sicCodes: ['6331'],
665
+ naicsCodes: ['524126'],
666
+ sector: IndustrySector.FINANCE_INSURANCE_REAL_ESTATE,
667
+ cik: '1067983',
668
+ },
669
+ // ── Chemicals & Manufacturing ───────────────────────────────────────
670
+ {
671
+ canonicalName: 'DOW',
672
+ aliases: [
673
+ 'DOW INC',
674
+ 'DOW INC.',
675
+ 'DOW CHEMICAL',
676
+ 'DOW CHEMICAL CO',
677
+ 'DOW CHEMICAL COMPANY',
678
+ 'THE DOW CHEMICAL COMPANY',
679
+ 'DOW CHEMICAL CO TEXAS OPERATIONS',
680
+ 'DOW CHEMICAL CO FREEPORT TX',
681
+ 'DOW CHEMICAL MIDLAND',
682
+ ],
683
+ sicCodes: ['2821'],
684
+ naicsCodes: ['325211'],
685
+ sector: IndustrySector.MISC_BUSINESS,
686
+ cik: '1751788',
687
+ },
688
+ {
689
+ canonicalName: 'DUPONT',
690
+ aliases: [
691
+ 'DUPONT DE NEMOURS',
692
+ 'E I DU PONT DE NEMOURS',
693
+ 'EI DUPONT',
694
+ 'DD',
695
+ 'DUPONT INC',
696
+ 'CHEMOURS',
697
+ ],
698
+ sicCodes: ['2821'],
699
+ naicsCodes: ['325211'],
700
+ sector: IndustrySector.MISC_BUSINESS,
701
+ cik: '1666700',
702
+ },
703
+ {
704
+ canonicalName: '3M',
705
+ aliases: ['3M COMPANY', '3M CO', 'MINNESOTA MINING AND MANUFACTURING', 'MMM'],
706
+ sicCodes: ['3841'],
707
+ naicsCodes: ['339999'],
708
+ sector: IndustrySector.MISC_BUSINESS,
709
+ cik: '66740',
710
+ },
711
+ {
712
+ canonicalName: 'BASF',
713
+ aliases: ['BASF CORP', 'BASF CORPORATION', 'BASF SE'],
714
+ sicCodes: ['2810'],
715
+ naicsCodes: ['325110'],
716
+ sector: IndustrySector.MISC_BUSINESS,
717
+ cik: null,
718
+ },
719
+ {
720
+ canonicalName: 'HONEYWELL',
721
+ aliases: ['HONEYWELL INTERNATIONAL', 'HONEYWELL INTERNATIONAL INC', 'HON'],
722
+ sicCodes: ['3728'],
723
+ naicsCodes: ['334512'],
724
+ sector: IndustrySector.DEFENSE,
725
+ cik: '773840',
726
+ },
727
+ {
728
+ canonicalName: 'CATERPILLAR',
729
+ aliases: ['CATERPILLAR INC', 'CAT'],
730
+ sicCodes: ['3531'],
731
+ naicsCodes: ['333120'],
732
+ sector: IndustrySector.MISC_BUSINESS,
733
+ cik: '18230',
734
+ },
735
+ {
736
+ canonicalName: 'GENERAL ELECTRIC',
737
+ aliases: ['GENERAL ELECTRIC CO', 'GENERAL ELECTRIC COMPANY', 'GE', 'GE AEROSPACE'],
738
+ sicCodes: ['3511'],
739
+ naicsCodes: ['336412'],
740
+ sector: IndustrySector.MISC_BUSINESS,
741
+ cik: '40554',
742
+ },
743
+ {
744
+ canonicalName: 'PROCTER AND GAMBLE',
745
+ aliases: [
746
+ 'PROCTER & GAMBLE',
747
+ 'PROCTER & GAMBLE CO',
748
+ 'THE PROCTER & GAMBLE COMPANY',
749
+ 'P&G',
750
+ 'PG',
751
+ ],
752
+ sicCodes: ['2841'],
753
+ naicsCodes: ['325611'],
754
+ sector: IndustrySector.MISC_BUSINESS,
755
+ cik: '80424',
756
+ },
757
+ // ── Transportation ──────────────────────────────────────────────────
758
+ {
759
+ canonicalName: 'UNION PACIFIC',
760
+ aliases: ['UNION PACIFIC CORP', 'UNION PACIFIC RAILROAD', 'UNP'],
761
+ sicCodes: ['4011'],
762
+ naicsCodes: ['482111'],
763
+ sector: IndustrySector.TRANSPORTATION,
764
+ cik: '100885',
765
+ },
766
+ {
767
+ canonicalName: 'FEDEX',
768
+ aliases: ['FEDEX CORP', 'FEDEX CORPORATION', 'FEDERAL EXPRESS', 'FDX'],
769
+ sicCodes: ['4513'],
770
+ naicsCodes: ['492110'],
771
+ sector: IndustrySector.TRANSPORTATION,
772
+ cik: '1048911',
773
+ },
774
+ {
775
+ canonicalName: 'UNITED PARCEL SERVICE',
776
+ aliases: ['UPS', 'UNITED PARCEL SERVICE INC'],
777
+ sicCodes: ['4215'],
778
+ naicsCodes: ['492110'],
779
+ sector: IndustrySector.TRANSPORTATION,
780
+ cik: '1090727',
781
+ },
782
+ {
783
+ canonicalName: 'DELTA AIR LINES',
784
+ aliases: ['DELTA AIR LINES INC', 'DELTA AIRLINES', 'DELTA', 'DAL'],
785
+ sicCodes: ['4512'],
786
+ naicsCodes: ['481111'],
787
+ sector: IndustrySector.TRANSPORTATION,
788
+ cik: '27904',
789
+ },
790
+ {
791
+ canonicalName: 'UNITED AIRLINES',
792
+ aliases: [
793
+ 'UNITED AIRLINES HOLDINGS',
794
+ 'UNITED AIRLINES HOLDINGS INC',
795
+ 'UNITED CONTINENTAL',
796
+ 'UAL',
797
+ ],
798
+ sicCodes: ['4512'],
799
+ naicsCodes: ['481111'],
800
+ sector: IndustrySector.TRANSPORTATION,
801
+ cik: '100517',
802
+ },
803
+ {
804
+ canonicalName: 'AMERICAN AIRLINES',
805
+ aliases: ['AMERICAN AIRLINES GROUP', 'AMERICAN AIRLINES GROUP INC', 'AAL', 'AMR CORP'],
806
+ sicCodes: ['4512'],
807
+ naicsCodes: ['481111'],
808
+ sector: IndustrySector.TRANSPORTATION,
809
+ cik: '6201',
810
+ },
811
+ {
812
+ canonicalName: 'NORFOLK SOUTHERN',
813
+ aliases: ['NORFOLK SOUTHERN CORP', 'NORFOLK SOUTHERN CORPORATION', 'NSC'],
814
+ sicCodes: ['4011'],
815
+ naicsCodes: ['482111'],
816
+ sector: IndustrySector.TRANSPORTATION,
817
+ cik: '73309',
818
+ },
819
+ // ── Consumer / Retail ───────────────────────────────────────────────
820
+ {
821
+ canonicalName: 'WALMART',
822
+ aliases: [
823
+ 'WALMART INC',
824
+ 'WAL-MART',
825
+ 'WAL MART',
826
+ 'WAL-MART STORES',
827
+ 'WAL-MART STORES INC',
828
+ 'WMT',
829
+ ],
830
+ sicCodes: ['5331'],
831
+ naicsCodes: ['452210'],
832
+ sector: IndustrySector.MISC_BUSINESS,
833
+ cik: '104169',
834
+ },
835
+ {
836
+ canonicalName: 'HOME DEPOT',
837
+ aliases: ['THE HOME DEPOT', 'HOME DEPOT INC', 'HD'],
838
+ sicCodes: ['5211'],
839
+ naicsCodes: ['444110'],
840
+ sector: IndustrySector.MISC_BUSINESS,
841
+ cik: '354950',
842
+ },
843
+ {
844
+ canonicalName: 'TARGET',
845
+ aliases: ['TARGET CORP', 'TARGET CORPORATION', 'TGT'],
846
+ sicCodes: ['5331'],
847
+ naicsCodes: ['452210'],
848
+ sector: IndustrySector.MISC_BUSINESS,
849
+ cik: '27419',
850
+ },
851
+ {
852
+ canonicalName: 'COSTCO',
853
+ aliases: ['COSTCO WHOLESALE', 'COSTCO WHOLESALE CORP', 'COST'],
854
+ sicCodes: ['5331'],
855
+ naicsCodes: ['452910'],
856
+ sector: IndustrySector.MISC_BUSINESS,
857
+ cik: '909832',
858
+ },
859
+ // ── Agriculture ─────────────────────────────────────────────────────
860
+ {
861
+ canonicalName: 'CARGILL',
862
+ aliases: ['CARGILL INC', 'CARGILL INCORPORATED'],
863
+ sicCodes: ['2041'],
864
+ naicsCodes: ['311211'],
865
+ sector: IndustrySector.AGRIBUSINESS,
866
+ cik: null,
867
+ },
868
+ {
869
+ canonicalName: 'ARCHER DANIELS MIDLAND',
870
+ aliases: ['ADM', 'ARCHER-DANIELS-MIDLAND', 'ARCHER DANIELS MIDLAND CO'],
871
+ sicCodes: ['2041'],
872
+ naicsCodes: ['311211'],
873
+ sector: IndustrySector.AGRIBUSINESS,
874
+ cik: '7084',
875
+ },
876
+ {
877
+ canonicalName: 'DEERE',
878
+ aliases: ['DEERE & CO', 'DEERE AND COMPANY', 'JOHN DEERE', 'DE'],
879
+ sicCodes: ['3523'],
880
+ naicsCodes: ['333111'],
881
+ sector: IndustrySector.AGRIBUSINESS,
882
+ cik: '315189',
883
+ },
884
+ {
885
+ canonicalName: 'MONSANTO',
886
+ aliases: ['MONSANTO CO', 'MONSANTO COMPANY', 'BAYER CROP SCIENCE'],
887
+ sicCodes: ['2870'],
888
+ naicsCodes: ['325320'],
889
+ sector: IndustrySector.AGRIBUSINESS,
890
+ cik: null,
891
+ },
892
+ {
893
+ canonicalName: 'BAYER',
894
+ aliases: ['BAYER AG', 'BAYER CORP', 'BAYER HEALTHCARE', 'BAYRY'],
895
+ sicCodes: ['2834'],
896
+ naicsCodes: ['325412'],
897
+ sector: IndustrySector.HEALTH,
898
+ cik: null,
899
+ },
900
+ // ── Construction ────────────────────────────────────────────────────
901
+ {
902
+ canonicalName: 'BECHTEL',
903
+ aliases: ['BECHTEL GROUP', 'BECHTEL CORP', 'BECHTEL NATIONAL'],
904
+ sicCodes: ['1542'],
905
+ naicsCodes: ['236220'],
906
+ sector: IndustrySector.CONSTRUCTION,
907
+ cik: null,
908
+ },
909
+ {
910
+ canonicalName: 'FLUOR',
911
+ aliases: ['FLUOR CORP', 'FLUOR CORPORATION', 'FLR'],
912
+ sicCodes: ['1542'],
913
+ naicsCodes: ['236220'],
914
+ sector: IndustrySector.CONSTRUCTION,
915
+ cik: '1124198',
916
+ },
917
+ // ── Automotive ──────────────────────────────────────────────────────
918
+ {
919
+ canonicalName: 'GENERAL MOTORS',
920
+ aliases: ['GENERAL MOTORS CO', 'GENERAL MOTORS COMPANY', 'GM'],
921
+ sicCodes: ['3711'],
922
+ naicsCodes: ['336111'],
923
+ sector: IndustrySector.TRANSPORTATION,
924
+ cik: '1467858',
925
+ },
926
+ {
927
+ canonicalName: 'FORD MOTOR',
928
+ aliases: ['FORD MOTOR CO', 'FORD MOTOR COMPANY', 'FORD', 'F'],
929
+ sicCodes: ['3711'],
930
+ naicsCodes: ['336111'],
931
+ sector: IndustrySector.TRANSPORTATION,
932
+ cik: '37996',
933
+ },
934
+ {
935
+ canonicalName: 'TOYOTA',
936
+ aliases: ['TOYOTA MOTOR', 'TOYOTA MOTOR CORP', 'TM', 'TOYOTA MOTOR NORTH AMERICA'],
937
+ sicCodes: ['3711'],
938
+ naicsCodes: ['336111'],
939
+ sector: IndustrySector.TRANSPORTATION,
940
+ cik: '1094517',
941
+ },
942
+ {
943
+ canonicalName: 'STELLANTIS',
944
+ aliases: ['STELLANTIS NV', 'FIAT CHRYSLER', 'CHRYSLER', 'FCA', 'FIAT CHRYSLER AUTOMOBILES'],
945
+ sicCodes: ['3711'],
946
+ naicsCodes: ['336111'],
947
+ sector: IndustrySector.TRANSPORTATION,
948
+ cik: '1513153',
949
+ },
950
+ {
951
+ canonicalName: 'TESLA',
952
+ aliases: ['TESLA INC', 'TESLA MOTORS', 'TSLA'],
953
+ sicCodes: ['3711'],
954
+ naicsCodes: ['336111'],
955
+ sector: IndustrySector.TRANSPORTATION,
956
+ cik: '1318605',
957
+ },
958
+ // ── Tobacco ─────────────────────────────────────────────────────────
959
+ {
960
+ canonicalName: 'PHILIP MORRIS',
961
+ aliases: [
962
+ 'PHILIP MORRIS INTERNATIONAL',
963
+ 'PHILIP MORRIS INTERNATIONAL INC',
964
+ 'PM',
965
+ 'ALTRIA',
966
+ 'ALTRIA GROUP',
967
+ 'ALTRIA GROUP INC',
968
+ 'MO',
969
+ ],
970
+ sicCodes: ['2111'],
971
+ naicsCodes: ['312230'],
972
+ sector: IndustrySector.MISC_BUSINESS,
973
+ cik: '1413329',
974
+ },
975
+ {
976
+ canonicalName: 'REYNOLDS AMERICAN',
977
+ aliases: [
978
+ 'R.J. REYNOLDS',
979
+ 'RJ REYNOLDS',
980
+ 'RJ REYNOLDS TOBACCO',
981
+ 'BRITISH AMERICAN TOBACCO',
982
+ 'BAT',
983
+ ],
984
+ sicCodes: ['2111'],
985
+ naicsCodes: ['312230'],
986
+ sector: IndustrySector.MISC_BUSINESS,
987
+ cik: null,
988
+ },
989
+ // ── Insurance ───────────────────────────────────────────────────────
990
+ {
991
+ canonicalName: 'STATE FARM',
992
+ aliases: ['STATE FARM INSURANCE', 'STATE FARM MUTUAL', 'STATE FARM MUTUAL AUTOMOBILE'],
993
+ sicCodes: ['6311'],
994
+ naicsCodes: ['524126'],
995
+ sector: IndustrySector.FINANCE_INSURANCE_REAL_ESTATE,
996
+ cik: null,
997
+ },
998
+ {
999
+ canonicalName: 'ALLSTATE',
1000
+ aliases: ['ALLSTATE CORP', 'THE ALLSTATE CORPORATION', 'ALL'],
1001
+ sicCodes: ['6331'],
1002
+ naicsCodes: ['524126'],
1003
+ sector: IndustrySector.FINANCE_INSURANCE_REAL_ESTATE,
1004
+ cik: '899629',
1005
+ },
1006
+ {
1007
+ canonicalName: 'PROGRESSIVE',
1008
+ aliases: ['PROGRESSIVE CORP', 'THE PROGRESSIVE CORPORATION', 'PGR'],
1009
+ sicCodes: ['6331'],
1010
+ naicsCodes: ['524126'],
1011
+ sector: IndustrySector.FINANCE_INSURANCE_REAL_ESTATE,
1012
+ cik: '80661',
1013
+ },
1014
+ {
1015
+ canonicalName: 'METLIFE',
1016
+ aliases: ['METLIFE INC', 'METROPOLITAN LIFE', 'MET'],
1017
+ sicCodes: ['6311'],
1018
+ naicsCodes: ['524113'],
1019
+ sector: IndustrySector.FINANCE_INSURANCE_REAL_ESTATE,
1020
+ cik: '1099219',
1021
+ },
1022
+ // ── Food & Beverage ─────────────────────────────────────────────────
1023
+ {
1024
+ canonicalName: 'PEPSICO',
1025
+ aliases: ['PEPSICO INC', 'PEPSI', 'FRITO-LAY', 'FRITO LAY', 'PEP'],
1026
+ sicCodes: ['2086'],
1027
+ naicsCodes: ['312111'],
1028
+ sector: IndustrySector.AGRIBUSINESS,
1029
+ cik: '77476',
1030
+ },
1031
+ {
1032
+ canonicalName: 'COCA COLA',
1033
+ aliases: ['THE COCA-COLA COMPANY', 'COCA-COLA', 'COCA COLA CO', 'COKE', 'KO'],
1034
+ sicCodes: ['2086'],
1035
+ naicsCodes: ['312111'],
1036
+ sector: IndustrySector.AGRIBUSINESS,
1037
+ cik: '21344',
1038
+ },
1039
+ {
1040
+ canonicalName: 'NESTLE',
1041
+ aliases: ['NESTLE USA', 'NESTLE SA', 'NSRGY'],
1042
+ sicCodes: ['2024'],
1043
+ naicsCodes: ['311520'],
1044
+ sector: IndustrySector.AGRIBUSINESS,
1045
+ cik: null,
1046
+ },
1047
+ {
1048
+ canonicalName: 'TYSON FOODS',
1049
+ aliases: ['TYSON FOODS INC', 'TYSON', 'TSN'],
1050
+ sicCodes: ['2011'],
1051
+ naicsCodes: ['311611'],
1052
+ sector: IndustrySector.AGRIBUSINESS,
1053
+ cik: '100493',
1054
+ },
1055
+ // ── Labor ───────────────────────────────────────────────────────────
1056
+ {
1057
+ canonicalName: 'AFL-CIO',
1058
+ aliases: ['AMERICAN FEDERATION OF LABOR', 'AFL CIO', 'AFLCIO'],
1059
+ sicCodes: [],
1060
+ naicsCodes: ['813930'],
1061
+ sector: IndustrySector.LABOR,
1062
+ cik: null,
1063
+ },
1064
+ {
1065
+ canonicalName: 'SEIU',
1066
+ aliases: ['SERVICE EMPLOYEES INTERNATIONAL UNION', 'SERVICE EMPLOYEES INTL UNION'],
1067
+ sicCodes: [],
1068
+ naicsCodes: ['813930'],
1069
+ sector: IndustrySector.LABOR,
1070
+ cik: null,
1071
+ },
1072
+ {
1073
+ canonicalName: 'TEAMSTERS',
1074
+ aliases: ['INTERNATIONAL BROTHERHOOD OF TEAMSTERS', 'IBT'],
1075
+ sicCodes: [],
1076
+ naicsCodes: ['813930'],
1077
+ sector: IndustrySector.LABOR,
1078
+ cik: null,
1079
+ },
1080
+ {
1081
+ canonicalName: 'UAW',
1082
+ aliases: [
1083
+ 'UNITED AUTO WORKERS',
1084
+ 'UNITED AUTOMOBILE WORKERS',
1085
+ 'INTERNATIONAL UNION UNITED AUTOMOBILE',
1086
+ ],
1087
+ sicCodes: [],
1088
+ naicsCodes: ['813930'],
1089
+ sector: IndustrySector.LABOR,
1090
+ cik: null,
1091
+ },
1092
+ // ── Trade Associations ──────────────────────────────────────────────
1093
+ {
1094
+ canonicalName: 'US CHAMBER OF COMMERCE',
1095
+ aliases: [
1096
+ 'CHAMBER OF COMMERCE OF THE UNITED STATES',
1097
+ 'U.S. CHAMBER OF COMMERCE',
1098
+ 'UNITED STATES CHAMBER OF COMMERCE',
1099
+ 'USCOC',
1100
+ ],
1101
+ sicCodes: [],
1102
+ naicsCodes: ['813910'],
1103
+ sector: IndustrySector.MISC_BUSINESS,
1104
+ cik: null,
1105
+ },
1106
+ {
1107
+ canonicalName: 'NATIONAL ASSOCIATION OF REALTORS',
1108
+ aliases: ['NAR', 'NATL ASSN OF REALTORS', 'REALTORS PAC'],
1109
+ sicCodes: [],
1110
+ naicsCodes: ['813910'],
1111
+ sector: IndustrySector.FINANCE_INSURANCE_REAL_ESTATE,
1112
+ cik: null,
1113
+ },
1114
+ {
1115
+ canonicalName: 'AMERICAN MEDICAL ASSOCIATION',
1116
+ aliases: ['AMA', 'AMPAC'],
1117
+ sicCodes: [],
1118
+ naicsCodes: ['813920'],
1119
+ sector: IndustrySector.HEALTH,
1120
+ cik: null,
1121
+ },
1122
+ {
1123
+ canonicalName: 'AMERICAN HOSPITAL ASSOCIATION',
1124
+ aliases: ['AHA', 'AM HOSPITAL ASSN'],
1125
+ sicCodes: [],
1126
+ naicsCodes: ['813920'],
1127
+ sector: IndustrySector.HEALTH,
1128
+ cik: null,
1129
+ },
1130
+ {
1131
+ canonicalName: 'PHRMA',
1132
+ aliases: [
1133
+ 'PHARMACEUTICAL RESEARCH AND MANUFACTURERS OF AMERICA',
1134
+ 'PHARMACEUTICAL RESEARCH & MANUFACTURERS',
1135
+ 'PHARMA',
1136
+ ],
1137
+ sicCodes: [],
1138
+ naicsCodes: ['813910'],
1139
+ sector: IndustrySector.HEALTH,
1140
+ cik: null,
1141
+ },
1142
+ {
1143
+ canonicalName: 'AMERICAN PETROLEUM INSTITUTE',
1144
+ aliases: ['API', 'AMER PETROLEUM INST'],
1145
+ sicCodes: [],
1146
+ naicsCodes: ['813910'],
1147
+ sector: IndustrySector.ENERGY_NATURAL_RESOURCES,
1148
+ cik: null,
1149
+ },
1150
+ {
1151
+ canonicalName: 'NATIONAL RIFLE ASSOCIATION',
1152
+ aliases: ['NRA', 'NRA OF AMERICA', 'NRA POLITICAL VICTORY FUND'],
1153
+ sicCodes: [],
1154
+ naicsCodes: ['813410'],
1155
+ sector: IndustrySector.IDEOLOGY_SINGLE_ISSUE,
1156
+ cik: null,
1157
+ },
1158
+ {
1159
+ canonicalName: 'AARP',
1160
+ aliases: ['AMERICAN ASSOCIATION OF RETIRED PERSONS'],
1161
+ sicCodes: [],
1162
+ naicsCodes: ['813410'],
1163
+ sector: IndustrySector.IDEOLOGY_SINGLE_ISSUE,
1164
+ cik: null,
1165
+ },
1166
+ {
1167
+ canonicalName: 'NATIONAL ASSOCIATION OF MANUFACTURERS',
1168
+ aliases: ['NAM', 'NATL ASSN OF MANUFACTURERS'],
1169
+ sicCodes: [],
1170
+ naicsCodes: ['813910'],
1171
+ sector: IndustrySector.MISC_BUSINESS,
1172
+ cik: null,
1173
+ },
1174
+ {
1175
+ canonicalName: 'BUSINESS ROUNDTABLE',
1176
+ aliases: ['BRT'],
1177
+ sicCodes: [],
1178
+ naicsCodes: ['813910'],
1179
+ sector: IndustrySector.MISC_BUSINESS,
1180
+ cik: null,
1181
+ },
1182
+ {
1183
+ canonicalName: 'BLUE CROSS BLUE SHIELD',
1184
+ aliases: ['BLUE CROSS AND BLUE SHIELD', 'BCBS', 'BLUE CROSS BLUE SHIELD ASSOCIATION', 'BCBSA'],
1185
+ sicCodes: ['6324'],
1186
+ naicsCodes: ['524114'],
1187
+ sector: IndustrySector.HEALTH,
1188
+ cik: null,
1189
+ },
1190
+ // ── Media & Entertainment ───────────────────────────────────────────
1191
+ {
1192
+ canonicalName: 'WALT DISNEY',
1193
+ aliases: ['THE WALT DISNEY COMPANY', 'DISNEY', 'WALT DISNEY CO', 'DIS'],
1194
+ sicCodes: ['7812'],
1195
+ naicsCodes: ['512110'],
1196
+ sector: IndustrySector.COMMUNICATIONS_ELECTRONICS,
1197
+ cik: '1744489',
1198
+ },
1199
+ {
1200
+ canonicalName: 'WARNER BROS DISCOVERY',
1201
+ aliases: [
1202
+ 'WARNER BROS',
1203
+ 'WARNER MEDIA',
1204
+ 'WARNERMEDIA',
1205
+ 'WBD',
1206
+ 'DISCOVERY INC',
1207
+ 'AT&T WARNERMEDIA',
1208
+ ],
1209
+ sicCodes: ['4841'],
1210
+ naicsCodes: ['512110'],
1211
+ sector: IndustrySector.COMMUNICATIONS_ELECTRONICS,
1212
+ cik: '1437107',
1213
+ },
1214
+ {
1215
+ canonicalName: 'PARAMOUNT',
1216
+ aliases: ['PARAMOUNT GLOBAL', 'VIACOM', 'VIACOMBSCBS', 'CBS', 'PARA'],
1217
+ sicCodes: ['4841'],
1218
+ naicsCodes: ['512110'],
1219
+ sector: IndustrySector.COMMUNICATIONS_ELECTRONICS,
1220
+ cik: '813828',
1221
+ },
1222
+ // ── Lawyers & Lobbyists ─────────────────────────────────────────────
1223
+ {
1224
+ canonicalName: 'AKIN GUMP',
1225
+ aliases: [
1226
+ 'AKIN GUMP STRAUSS HAUER AND FELD',
1227
+ 'AKIN GUMP STRAUSS HAUER & FELD',
1228
+ 'AKIN GUMP STRAUSS',
1229
+ ],
1230
+ sicCodes: ['8111'],
1231
+ naicsCodes: ['541110'],
1232
+ sector: IndustrySector.LAWYERS_LOBBYISTS,
1233
+ cik: null,
1234
+ },
1235
+ {
1236
+ canonicalName: 'SQUIRE PATTON BOGGS',
1237
+ aliases: ['SQUIRE PATTON BOGGS LLP', 'PATTON BOGGS', 'SQUIRE SANDERS'],
1238
+ sicCodes: ['8111'],
1239
+ naicsCodes: ['541110'],
1240
+ sector: IndustrySector.LAWYERS_LOBBYISTS,
1241
+ cik: null,
1242
+ },
1243
+ {
1244
+ canonicalName: 'BROWNSTEIN HYATT',
1245
+ aliases: ['BROWNSTEIN HYATT FARBER SCHRECK', 'BROWNSTEIN HYATT FARBER SCHRECK LLP'],
1246
+ sicCodes: ['8111'],
1247
+ naicsCodes: ['541110'],
1248
+ sector: IndustrySector.LAWYERS_LOBBYISTS,
1249
+ cik: null,
1250
+ },
1251
+ {
1252
+ canonicalName: 'HOLLAND AND KNIGHT',
1253
+ aliases: ['HOLLAND & KNIGHT', 'HOLLAND & KNIGHT LLP'],
1254
+ sicCodes: ['8111'],
1255
+ naicsCodes: ['541110'],
1256
+ sector: IndustrySector.LAWYERS_LOBBYISTS,
1257
+ cik: null,
1258
+ },
1259
+ {
1260
+ canonicalName: 'K STREET PARTNERS',
1261
+ aliases: ['K&L GATES', 'K AND L GATES'],
1262
+ sicCodes: ['8111'],
1263
+ naicsCodes: ['541110'],
1264
+ sector: IndustrySector.LAWYERS_LOBBYISTS,
1265
+ cik: null,
1266
+ },
1267
+ ];
1268
/**
 * Lookup index from an upper-cased name to its COMPANY_ALIAS_TABLE entry.
 *
 * Each entry is registered under its canonical name first and then under
 * every alias, so all spellings of one company resolve to the same object.
 * Map#set overwrites, so when two entries share a key the entry that appears
 * later in the table wins. Populated once, when this module is evaluated.
 */
const ALIAS_INDEX = new Map();
COMPANY_ALIAS_TABLE.forEach((company) => {
    // Canonical name goes first, followed by the aliases in table order.
    const spellings = [company.canonicalName, ...company.aliases];
    spellings.forEach((spelling) => {
        ALIAS_INDEX.set(spelling.toUpperCase(), company);
    });
});
1281
/**
 * Pattern for corporate designators (INC, LLC, CORP, ...) that are removed
 * from a name before the alias lookup is retried.
 *
 * Each token matches only as a whole word, case-insensitively, together with
 * one optional trailing period. The pattern is not anchored to the end of the
 * string, and the `g` flag means String#replace removes every occurrence,
 * wherever it sits in the name.
 */
const STRIP_SUFFIX = new RegExp(
    `\\b(${[
        'inc',
        'llc',
        'llp',
        'corp',
        'lp',
        'ltd',
        'co',
        'company',
        'corporation',
        'incorporated',
        'limited',
        'plc',
        'sa',
        'ag',
        'gmbh',
    ].join('|')})\\b\\.?`,
    'gi',
);
1285
/**
 * Look up a company by any known alias.
 *
 * The trimmed, upper-cased input is tried against ALIAS_INDEX as-is. If that
 * misses, several normalised spellings are tried in order and the first hit
 * is returned:
 *   1. designators stripped, `&` spelled out as AND, punctuation deleted
 *      ("R.J. Reynolds Inc" -> "RJ REYNOLDS");
 *   2. designators stripped, inner punctuation kept, edge punctuation trimmed
 *      ("AT&T WarnerMedia Inc" -> "AT&T WARNERMEDIA");
 *   3. designators stripped, `&` spelled out, punctuation turned into spaces
 *      ("Coca-Cola Co." -> "COCA COLA");
 *   4. punctuation deleted first, then designators stripped, so dotted forms
 *      such as "L.L.C." are recognised ("Tesla, L.L.C." -> "TESLA").
 * Candidate 1 is the only fallback that existed before, and it is still tried
 * first, so every name that used to resolve still resolves to the same entry.
 *
 * @param {string} name - Company name in any casing, with or without a
 *   corporate designator or punctuation.
 * @returns {object|null} The matching alias-table entry, or null when the
 *   input is not a string, is blank, or matches no known spelling.
 */
export function findCompanyByAlias(name) {
    // Anything that is not a string cannot match an alias; report "not found"
    // instead of throwing on a missing .trim().
    if (typeof name !== 'string')
        return null;
    const upper = name.trim().toUpperCase();
    if (upper === '')
        return null;
    // Try direct lookup first
    const direct = ALIAS_INDEX.get(upper);
    if (direct)
        return direct;
    const collapseSpaces = (text) => text.replace(/\s+/g, ' ').trim();
    const spellOutAmpersand = (text) => text.replace(/&/g, ' AND ');
    const withoutSuffix = upper.replace(STRIP_SUFFIX, '');
    const candidates = [
        // 1. Original fallback key: punctuation deleted outright.
        collapseSpaces(spellOutAmpersand(withoutSuffix).replace(/[^\w\s]/g, '')),
        // 2. Keep inner punctuation (hyphens, ampersands) because some aliases
        //    are stored with it; only drop what the designator left dangling.
        collapseSpaces(withoutSuffix).replace(/^\W+|\W+$/g, ''),
        // 3. Punctuation becomes a word break, so hyphenated names do not fuse.
        collapseSpaces(spellOutAmpersand(withoutSuffix).replace(/[^\w\s]/g, ' ')),
        // 4. Delete punctuation before stripping designators so that dotted
        //    abbreviations collapse into a token the suffix pattern knows.
        collapseSpaces(spellOutAmpersand(upper).replace(/[^\w\s]/g, '').replace(STRIP_SUFFIX, '')),
    ];
    for (const candidate of candidates) {
        const match = ALIAS_INDEX.get(candidate);
        if (match)
            return match;
    }
    return null;
}
1307
+ //# sourceMappingURL=company-alias-table.js.map