@mailwoman/neural-weights-en-us 4.0.0 → 4.2.0

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,495 @@
1
+ {
2
+ "model": "neural-weights-en-us",
3
+ "model_version": "4.0.0",
4
+ "method": "per-locale isotonic (PAVA)",
5
+ "tables": {
6
+ "DE": [
7
+ {
8
+ "lo": 0.0,
9
+ "hi": 0.05,
10
+ "center": 0.025,
11
+ "calibrated": 0.8333333333333334
12
+ },
13
+ {
14
+ "lo": 0.05,
15
+ "hi": 0.1,
16
+ "center": 0.07500000000000001,
17
+ "calibrated": 0.8333333333333334
18
+ },
19
+ {
20
+ "lo": 0.1,
21
+ "hi": 0.15000000000000002,
22
+ "center": 0.125,
23
+ "calibrated": 0.8333333333333334
24
+ },
25
+ {
26
+ "lo": 0.15000000000000002,
27
+ "hi": 0.2,
28
+ "center": 0.17500000000000002,
29
+ "calibrated": 0.8333333333333334
30
+ },
31
+ {
32
+ "lo": 0.2,
33
+ "hi": 0.25,
34
+ "center": 0.225,
35
+ "calibrated": 0.8333333333333334
36
+ },
37
+ {
38
+ "lo": 0.25,
39
+ "hi": 0.30000000000000004,
40
+ "center": 0.275,
41
+ "calibrated": 0.8333333333333334
42
+ },
43
+ {
44
+ "lo": 0.30000000000000004,
45
+ "hi": 0.35000000000000003,
46
+ "center": 0.32500000000000007,
47
+ "calibrated": 0.8333333333333334
48
+ },
49
+ {
50
+ "lo": 0.35000000000000003,
51
+ "hi": 0.4,
52
+ "center": 0.375,
53
+ "calibrated": 0.8333333333333334
54
+ },
55
+ {
56
+ "lo": 0.4,
57
+ "hi": 0.45,
58
+ "center": 0.42500000000000004,
59
+ "calibrated": 0.8333333333333334
60
+ },
61
+ {
62
+ "lo": 0.45,
63
+ "hi": 0.5,
64
+ "center": 0.475,
65
+ "calibrated": 0.8333333333333334
66
+ },
67
+ {
68
+ "lo": 0.5,
69
+ "hi": 0.55,
70
+ "center": 0.525,
71
+ "calibrated": 0.8333333333333334
72
+ },
73
+ {
74
+ "lo": 0.55,
75
+ "hi": 0.6000000000000001,
76
+ "center": 0.5750000000000001,
77
+ "calibrated": 0.8333333333333334
78
+ },
79
+ {
80
+ "lo": 0.6000000000000001,
81
+ "hi": 0.65,
82
+ "center": 0.625,
83
+ "calibrated": 0.8333333333333334
84
+ },
85
+ {
86
+ "lo": 0.65,
87
+ "hi": 0.7000000000000001,
88
+ "center": 0.675,
89
+ "calibrated": 0.8333333333333334
90
+ },
91
+ {
92
+ "lo": 0.7000000000000001,
93
+ "hi": 0.75,
94
+ "center": 0.7250000000000001,
95
+ "calibrated": 0.8524173027989822
96
+ },
97
+ {
98
+ "lo": 0.75,
99
+ "hi": 0.8,
100
+ "center": 0.775,
101
+ "calibrated": 0.8524173027989822
102
+ },
103
+ {
104
+ "lo": 0.8,
105
+ "hi": 0.8500000000000001,
106
+ "center": 0.8250000000000001,
107
+ "calibrated": 0.8524173027989822
108
+ },
109
+ {
110
+ "lo": 0.8500000000000001,
111
+ "hi": 0.9,
112
+ "center": 0.875,
113
+ "calibrated": 0.8524173027989822
114
+ },
115
+ {
116
+ "lo": 0.9,
117
+ "hi": 0.9500000000000001,
118
+ "center": 0.925,
119
+ "calibrated": 0.8524173027989822
120
+ },
121
+ {
122
+ "lo": 0.9500000000000001,
123
+ "hi": 1.0,
124
+ "center": 0.9750000000000001,
125
+ "calibrated": 0.8524173027989822
126
+ }
127
+ ],
128
+ "FR": [
129
+ {
130
+ "lo": 0.0,
131
+ "hi": 0.05,
132
+ "center": 0.025,
133
+ "calibrated": 0.7916666666666666
134
+ },
135
+ {
136
+ "lo": 0.05,
137
+ "hi": 0.1,
138
+ "center": 0.07500000000000001,
139
+ "calibrated": 0.7916666666666666
140
+ },
141
+ {
142
+ "lo": 0.1,
143
+ "hi": 0.15000000000000002,
144
+ "center": 0.125,
145
+ "calibrated": 0.7916666666666666
146
+ },
147
+ {
148
+ "lo": 0.15000000000000002,
149
+ "hi": 0.2,
150
+ "center": 0.17500000000000002,
151
+ "calibrated": 0.7916666666666666
152
+ },
153
+ {
154
+ "lo": 0.2,
155
+ "hi": 0.25,
156
+ "center": 0.225,
157
+ "calibrated": 0.7916666666666666
158
+ },
159
+ {
160
+ "lo": 0.25,
161
+ "hi": 0.30000000000000004,
162
+ "center": 0.275,
163
+ "calibrated": 0.7916666666666666
164
+ },
165
+ {
166
+ "lo": 0.30000000000000004,
167
+ "hi": 0.35000000000000003,
168
+ "center": 0.32500000000000007,
169
+ "calibrated": 0.7916666666666666
170
+ },
171
+ {
172
+ "lo": 0.35000000000000003,
173
+ "hi": 0.4,
174
+ "center": 0.375,
175
+ "calibrated": 0.7916666666666666
176
+ },
177
+ {
178
+ "lo": 0.4,
179
+ "hi": 0.45,
180
+ "center": 0.42500000000000004,
181
+ "calibrated": 0.7916666666666666
182
+ },
183
+ {
184
+ "lo": 0.45,
185
+ "hi": 0.5,
186
+ "center": 0.475,
187
+ "calibrated": 0.7916666666666666
188
+ },
189
+ {
190
+ "lo": 0.5,
191
+ "hi": 0.55,
192
+ "center": 0.525,
193
+ "calibrated": 0.9
194
+ },
195
+ {
196
+ "lo": 0.55,
197
+ "hi": 0.6000000000000001,
198
+ "center": 0.5750000000000001,
199
+ "calibrated": 0.9508196721311475
200
+ },
201
+ {
202
+ "lo": 0.6000000000000001,
203
+ "hi": 0.65,
204
+ "center": 0.625,
205
+ "calibrated": 0.9508196721311475
206
+ },
207
+ {
208
+ "lo": 0.65,
209
+ "hi": 0.7000000000000001,
210
+ "center": 0.675,
211
+ "calibrated": 0.9508196721311475
212
+ },
213
+ {
214
+ "lo": 0.7000000000000001,
215
+ "hi": 0.75,
216
+ "center": 0.7250000000000001,
217
+ "calibrated": 0.9523809523809523
218
+ },
219
+ {
220
+ "lo": 0.75,
221
+ "hi": 0.8,
222
+ "center": 0.775,
223
+ "calibrated": 0.9523809523809523
224
+ },
225
+ {
226
+ "lo": 0.8,
227
+ "hi": 0.8500000000000001,
228
+ "center": 0.8250000000000001,
229
+ "calibrated": 0.9523809523809523
230
+ },
231
+ {
232
+ "lo": 0.8500000000000001,
233
+ "hi": 0.9,
234
+ "center": 0.875,
235
+ "calibrated": 0.9523809523809523
236
+ },
237
+ {
238
+ "lo": 0.9,
239
+ "hi": 0.9500000000000001,
240
+ "center": 0.925,
241
+ "calibrated": 0.9843614248479583
242
+ },
243
+ {
244
+ "lo": 0.9500000000000001,
245
+ "hi": 1.0,
246
+ "center": 0.9750000000000001,
247
+ "calibrated": 0.9916666666666667
248
+ }
249
+ ],
250
+ "NL": [
251
+ {
252
+ "lo": 0.0,
253
+ "hi": 0.05,
254
+ "center": 0.025,
255
+ "calibrated": 0.2
256
+ },
257
+ {
258
+ "lo": 0.05,
259
+ "hi": 0.1,
260
+ "center": 0.07500000000000001,
261
+ "calibrated": 0.2
262
+ },
263
+ {
264
+ "lo": 0.1,
265
+ "hi": 0.15000000000000002,
266
+ "center": 0.125,
267
+ "calibrated": 0.2
268
+ },
269
+ {
270
+ "lo": 0.15000000000000002,
271
+ "hi": 0.2,
272
+ "center": 0.17500000000000002,
273
+ "calibrated": 0.2
274
+ },
275
+ {
276
+ "lo": 0.2,
277
+ "hi": 0.25,
278
+ "center": 0.225,
279
+ "calibrated": 0.2
280
+ },
281
+ {
282
+ "lo": 0.25,
283
+ "hi": 0.30000000000000004,
284
+ "center": 0.275,
285
+ "calibrated": 0.2
286
+ },
287
+ {
288
+ "lo": 0.30000000000000004,
289
+ "hi": 0.35000000000000003,
290
+ "center": 0.32500000000000007,
291
+ "calibrated": 0.2
292
+ },
293
+ {
294
+ "lo": 0.35000000000000003,
295
+ "hi": 0.4,
296
+ "center": 0.375,
297
+ "calibrated": 0.8947368421052632
298
+ },
299
+ {
300
+ "lo": 0.4,
301
+ "hi": 0.45,
302
+ "center": 0.42500000000000004,
303
+ "calibrated": 0.8947368421052632
304
+ },
305
+ {
306
+ "lo": 0.45,
307
+ "hi": 0.5,
308
+ "center": 0.475,
309
+ "calibrated": 0.8947368421052632
310
+ },
311
+ {
312
+ "lo": 0.5,
313
+ "hi": 0.55,
314
+ "center": 0.525,
315
+ "calibrated": 0.8947368421052632
316
+ },
317
+ {
318
+ "lo": 0.55,
319
+ "hi": 0.6000000000000001,
320
+ "center": 0.5750000000000001,
321
+ "calibrated": 0.9985590778097982
322
+ },
323
+ {
324
+ "lo": 0.6000000000000001,
325
+ "hi": 0.65,
326
+ "center": 0.625,
327
+ "calibrated": 0.9985590778097982
328
+ },
329
+ {
330
+ "lo": 0.65,
331
+ "hi": 0.7000000000000001,
332
+ "center": 0.675,
333
+ "calibrated": 0.9985590778097982
334
+ },
335
+ {
336
+ "lo": 0.7000000000000001,
337
+ "hi": 0.75,
338
+ "center": 0.7250000000000001,
339
+ "calibrated": 0.9985590778097982
340
+ },
341
+ {
342
+ "lo": 0.75,
343
+ "hi": 0.8,
344
+ "center": 0.775,
345
+ "calibrated": 0.9985590778097982
346
+ },
347
+ {
348
+ "lo": 0.8,
349
+ "hi": 0.8500000000000001,
350
+ "center": 0.8250000000000001,
351
+ "calibrated": 0.9985590778097982
352
+ },
353
+ {
354
+ "lo": 0.8500000000000001,
355
+ "hi": 0.9,
356
+ "center": 0.875,
357
+ "calibrated": 0.9985590778097982
358
+ },
359
+ {
360
+ "lo": 0.9,
361
+ "hi": 0.9500000000000001,
362
+ "center": 0.925,
363
+ "calibrated": 0.9985590778097982
364
+ },
365
+ {
366
+ "lo": 0.9500000000000001,
367
+ "hi": 1.0,
368
+ "center": 0.9750000000000001,
369
+ "calibrated": 1.0
370
+ }
371
+ ],
372
+ "US": [
373
+ {
374
+ "lo": 0.0,
375
+ "hi": 0.05,
376
+ "center": 0.025,
377
+ "calibrated": 0.0
378
+ },
379
+ {
380
+ "lo": 0.05,
381
+ "hi": 0.1,
382
+ "center": 0.07500000000000001,
383
+ "calibrated": 0.0
384
+ },
385
+ {
386
+ "lo": 0.1,
387
+ "hi": 0.15000000000000002,
388
+ "center": 0.125,
389
+ "calibrated": 0.0
390
+ },
391
+ {
392
+ "lo": 0.15000000000000002,
393
+ "hi": 0.2,
394
+ "center": 0.17500000000000002,
395
+ "calibrated": 0.3333333333333333
396
+ },
397
+ {
398
+ "lo": 0.2,
399
+ "hi": 0.25,
400
+ "center": 0.225,
401
+ "calibrated": 0.3333333333333333
402
+ },
403
+ {
404
+ "lo": 0.25,
405
+ "hi": 0.30000000000000004,
406
+ "center": 0.275,
407
+ "calibrated": 0.3333333333333333
408
+ },
409
+ {
410
+ "lo": 0.30000000000000004,
411
+ "hi": 0.35000000000000003,
412
+ "center": 0.32500000000000007,
413
+ "calibrated": 0.417910447761194
414
+ },
415
+ {
416
+ "lo": 0.35000000000000003,
417
+ "hi": 0.4,
418
+ "center": 0.375,
419
+ "calibrated": 0.417910447761194
420
+ },
421
+ {
422
+ "lo": 0.4,
423
+ "hi": 0.45,
424
+ "center": 0.42500000000000004,
425
+ "calibrated": 0.48717948717948717
426
+ },
427
+ {
428
+ "lo": 0.45,
429
+ "hi": 0.5,
430
+ "center": 0.475,
431
+ "calibrated": 0.6785714285714286
432
+ },
433
+ {
434
+ "lo": 0.5,
435
+ "hi": 0.55,
436
+ "center": 0.525,
437
+ "calibrated": 0.75
438
+ },
439
+ {
440
+ "lo": 0.55,
441
+ "hi": 0.6000000000000001,
442
+ "center": 0.5750000000000001,
443
+ "calibrated": 0.7755102040816326
444
+ },
445
+ {
446
+ "lo": 0.6000000000000001,
447
+ "hi": 0.65,
448
+ "center": 0.625,
449
+ "calibrated": 0.8554913294797688
450
+ },
451
+ {
452
+ "lo": 0.65,
453
+ "hi": 0.7000000000000001,
454
+ "center": 0.675,
455
+ "calibrated": 0.8984547461368654
456
+ },
457
+ {
458
+ "lo": 0.7000000000000001,
459
+ "hi": 0.75,
460
+ "center": 0.7250000000000001,
461
+ "calibrated": 0.8984547461368654
462
+ },
463
+ {
464
+ "lo": 0.75,
465
+ "hi": 0.8,
466
+ "center": 0.775,
467
+ "calibrated": 0.9469026548672567
468
+ },
469
+ {
470
+ "lo": 0.8,
471
+ "hi": 0.8500000000000001,
472
+ "center": 0.8250000000000001,
473
+ "calibrated": 0.9577092511013215
474
+ },
475
+ {
476
+ "lo": 0.8500000000000001,
477
+ "hi": 0.9,
478
+ "center": 0.875,
479
+ "calibrated": 0.9694719471947195
480
+ },
481
+ {
482
+ "lo": 0.9,
483
+ "hi": 0.9500000000000001,
484
+ "center": 0.925,
485
+ "calibrated": 0.9838576158940397
486
+ },
487
+ {
488
+ "lo": 0.9500000000000001,
489
+ "hi": 1.0,
490
+ "center": 0.9750000000000001,
491
+ "calibrated": 1.0
492
+ }
493
+ ]
494
+ }
495
+ }
@@ -0,0 +1,243 @@
1
+ {
2
+ "model": "neural-weights-en-us",
3
+ "model_version": "4.0.0",
4
+ "method": "isotonic-regression (PAVA) over per-span softmax confidence",
5
+ "created_from": "data/eval/calibration/confidences.jsonl",
6
+ "n_total": 32553,
7
+ "n_fit": 26043,
8
+ "n_eval": 6510,
9
+ "bins": 20,
10
+ "ece_bins": 15,
11
+ "metrics": {
12
+ "ece_raw_eval": 0.06733768396482998,
13
+ "ece_cal_eval": 0.003516504997239885,
14
+ "mce_raw_eval": 0.289115488729766,
15
+ "mce_cal_eval": 0.18286826492482933,
16
+ "mce_raw_eval_allbins": 0.8454483055409481,
17
+ "mce_cal_eval_allbins": 0.953985808965804,
18
+ "brier_raw_eval": 0.033950582453368766,
19
+ "brier_cal_eval": 0.027009249299634375,
20
+ "ece_raw_oa_eval": 0.07058600158908206,
21
+ "ece_cal_oa_eval": 0.006727186537647182,
22
+ "ece_raw_corpus_eval": 0.06592097892553006,
23
+ "ece_cal_corpus_eval": 0.006108435118670848
24
+ },
25
+ "per_tag_ece": {
26
+ "house_number": {
27
+ "n": 783,
28
+ "acc": 0.8876117496807152,
29
+ "ece_raw": 0.032203530366151964,
30
+ "ece_cal": 0.08212837028751453
31
+ },
32
+ "locality": {
33
+ "n": 1668,
34
+ "acc": 0.9724220623501199,
35
+ "ece_raw": 0.07590628618691278,
36
+ "ece_cal": 0.008323214057649167
37
+ },
38
+ "postcode": {
39
+ "n": 1547,
40
+ "acc": 0.9993535875888817,
41
+ "ece_raw": 0.08926967886821484,
42
+ "ece_cal": 0.022650235312503323
43
+ },
44
+ "region": {
45
+ "n": 1219,
46
+ "acc": 0.9975389663658737,
47
+ "ece_raw": 0.06392376399526842,
48
+ "ece_cal": 0.018509232370423873
49
+ },
50
+ "street": {
51
+ "n": 817,
52
+ "acc": 0.9645042839657283,
53
+ "ece_raw": 0.06236517084448636,
54
+ "ece_cal": 0.017999489099532674
55
+ },
56
+ "venue": {
57
+ "n": 434,
58
+ "acc": 0.9308755760368663,
59
+ "ece_raw": 0.11384168006361704,
60
+ "ece_cal": 0.0429750111796866
61
+ }
62
+ },
63
+ "per_locale_ece": {
64
+ "DE": {
65
+ "n": 195,
66
+ "acc": 0.8871794871794871,
67
+ "ece_raw": 0.11113936337159339,
68
+ "ece_cal": 0.09729335740608726
69
+ },
70
+ "FR": {
71
+ "n": 803,
72
+ "acc": 0.9663760896637609,
73
+ "ece_raw": 0.05943714249530754,
74
+ "ece_cal": 0.016894667938069707
75
+ },
76
+ "NL": {
77
+ "n": 192,
78
+ "acc": 0.9947916666666666,
79
+ "ece_raw": 0.17864070987172176,
80
+ "ece_cal": 0.046454384545716376
81
+ },
82
+ "US": {
83
+ "n": 5320,
84
+ "acc": 0.9719924812030075,
85
+ "ece_raw": 0.06844507512699036,
86
+ "ece_cal": 0.006977205495182824
87
+ }
88
+ },
89
+ "abstention_curve": [
90
+ {
91
+ "threshold": 0.5,
92
+ "coverage": 0.9940092165898617,
93
+ "precision": 0.9720290526966465,
94
+ "reviewed": 0.005990783410138256
95
+ },
96
+ {
97
+ "threshold": 0.8,
98
+ "coverage": 0.9824884792626728,
99
+ "precision": 0.9763914946841776,
100
+ "reviewed": 0.017511520737327202
101
+ },
102
+ {
103
+ "threshold": 0.9,
104
+ "coverage": 0.9646697388632872,
105
+ "precision": 0.9781847133757962,
106
+ "reviewed": 0.03533026113671278
107
+ },
108
+ {
109
+ "threshold": 0.95,
110
+ "coverage": 0.9419354838709677,
111
+ "precision": 0.9796151337247228,
112
+ "reviewed": 0.058064516129032295
113
+ },
114
+ {
115
+ "threshold": 0.97,
116
+ "coverage": 0.7308755760368664,
117
+ "precision": 0.9844472467423288,
118
+ "reviewed": 0.26912442396313363
119
+ }
120
+ ],
121
+ "table": [
122
+ {
123
+ "lo": 0.0,
124
+ "hi": 0.05,
125
+ "center": 0.025,
126
+ "calibrated": 0.0
127
+ },
128
+ {
129
+ "lo": 0.05,
130
+ "hi": 0.1,
131
+ "center": 0.07500000000000001,
132
+ "calibrated": 0.0
133
+ },
134
+ {
135
+ "lo": 0.1,
136
+ "hi": 0.15000000000000002,
137
+ "center": 0.125,
138
+ "calibrated": 0.0
139
+ },
140
+ {
141
+ "lo": 0.15000000000000002,
142
+ "hi": 0.2,
143
+ "center": 0.17500000000000002,
144
+ "calibrated": 0.21099134690621654
145
+ },
146
+ {
147
+ "lo": 0.2,
148
+ "hi": 0.25,
149
+ "center": 0.225,
150
+ "calibrated": 0.34782608695652173
151
+ },
152
+ {
153
+ "lo": 0.25,
154
+ "hi": 0.30000000000000004,
155
+ "center": 0.275,
156
+ "calibrated": 0.34782608695652173
157
+ },
158
+ {
159
+ "lo": 0.30000000000000004,
160
+ "hi": 0.35000000000000003,
161
+ "center": 0.32500000000000007,
162
+ "calibrated": 0.425
163
+ },
164
+ {
165
+ "lo": 0.35000000000000003,
166
+ "hi": 0.4,
167
+ "center": 0.375,
168
+ "calibrated": 0.425531914893617
169
+ },
170
+ {
171
+ "lo": 0.4,
172
+ "hi": 0.45,
173
+ "center": 0.42500000000000004,
174
+ "calibrated": 0.5208333333333334
175
+ },
176
+ {
177
+ "lo": 0.45,
178
+ "hi": 0.5,
179
+ "center": 0.475,
180
+ "calibrated": 0.7380952380952381
181
+ },
182
+ {
183
+ "lo": 0.5,
184
+ "hi": 0.55,
185
+ "center": 0.525,
186
+ "calibrated": 0.7761194029850746
187
+ },
188
+ {
189
+ "lo": 0.55,
190
+ "hi": 0.6000000000000001,
191
+ "center": 0.5750000000000001,
192
+ "calibrated": 0.84
193
+ },
194
+ {
195
+ "lo": 0.6000000000000001,
196
+ "hi": 0.65,
197
+ "center": 0.625,
198
+ "calibrated": 0.8511627906976744
199
+ },
200
+ {
201
+ "lo": 0.65,
202
+ "hi": 0.7000000000000001,
203
+ "center": 0.675,
204
+ "calibrated": 0.9238095238095239
205
+ },
206
+ {
207
+ "lo": 0.7000000000000001,
208
+ "hi": 0.75,
209
+ "center": 0.7250000000000001,
210
+ "calibrated": 0.9246323529411765
211
+ },
212
+ {
213
+ "lo": 0.75,
214
+ "hi": 0.8,
215
+ "center": 0.775,
216
+ "calibrated": 0.9568
217
+ },
218
+ {
219
+ "lo": 0.8,
220
+ "hi": 0.8500000000000001,
221
+ "center": 0.8250000000000001,
222
+ "calibrated": 0.9625668449197861
223
+ },
224
+ {
225
+ "lo": 0.8500000000000001,
226
+ "hi": 0.9,
227
+ "center": 0.875,
228
+ "calibrated": 0.9693251533742331
229
+ },
230
+ {
231
+ "lo": 0.9,
232
+ "hi": 0.9500000000000001,
233
+ "center": 0.925,
234
+ "calibrated": 0.9826212889210717
235
+ },
236
+ {
237
+ "lo": 0.9500000000000001,
238
+ "hi": 1.0,
239
+ "center": 0.9750000000000001,
240
+ "calibrated": 0.9856649395509499
241
+ }
242
+ ]
243
+ }
package/model-card.json CHANGED
@@ -1,17 +1,17 @@
1
1
  {
2
2
  "name": "neural-weights-en-us",
3
- "version": "4.0.0",
4
- "model_lineage": "Stage 3 / step 100000 (formerly v0.6.0) \u2014 relabeled to the unified 4.0.0 release version; tokenizer 0.6.0-a0",
5
- "phase": "Stage 3 \u2014 street decomposition + PO box + intersection",
3
+ "version": "4.2.0",
4
+ "model_lineage": "v1.0.2-consolidation-runB / step 20000 — consolidation of the parity campaign (unit + affix + country gazetteer-anchor + multi-locale balance) init_from consolidation v1.0.0 step-040000 (fresh optimizer — NOT resume; recorded honestly, see docs/articles/evals/2026-06-10-consolidation-session.md) @ affix 17x on corpus v0.4.12-consolidation — shipped as the unified 4.2.0 release version; tokenizer 0.6.0-a0",
5
+ "phase": "Stage 3 v1.0 consolidation: parity flag-plant (spine + country anchor + affix existence)",
6
6
  "license": "AGPL-3.0-only",
7
7
  "locale": "en-us",
8
8
  "training": {
9
- "corpus_version": "0.4.0+stage3",
9
+ "corpus_version": "0.4.12-consolidation",
10
10
  "tokenizer_version": "0.6.0-a0",
11
- "steps": 100000,
12
- "best_step": 100000,
11
+ "steps": 20000,
12
+ "best_step": 20000,
13
13
  "hardware": "NVIDIA A100-SXM4-40GB (Modal cloud)",
14
- "recipe": "v0.5.1 base + STAGE3 (33 BIO labels) + synth-po-box source @ 1.5x. CE-only (crf_loss_weight=0.0 after two NaN attempts with crf>0; the 33x33 transition table + bf16 was numerically unstable). lr=1.5e-4 constant, warmup=1000."
14
+ "recipe": "Run B of the consolidation campaign: init_from the clean v1.0.0 consolidation step-040000 (every proven lever: unit shard, affix-ml shard, country balanced shard + gazetteer soft anchor + channel choreography, both-order German), synth-affix 17x, 20k steps, CE-only, lr=1.5e-4, seed 42. Selected over v1.0.0/A/C at the fork: strongest stable variant (US postcode 97.3, country 89.8, FR hn 94.6). STATED RE-BASELINES vs canonical bars: affix 64.9/48.8 (vs 78/67), US street 76.2 (vs 80.4), unit 90.6 (vs 92) — measured 29M stability ceiling, see issue #492. GATE NUMBERS ARE REPAIRS-OFF (#486). Eval procedure REQUIRES --gazetteer-lexicon + --suppress-gaz-near-postcode (zero-filled clues degrade country recall and fake an affix crash)."
15
15
  },
16
16
  "architecture": {
17
17
  "hidden_size": 384,
@@ -79,19 +79,75 @@
79
79
  "intersection_a",
80
80
  "intersection_b"
81
81
  ],
82
- "notes": "v0.6.0 \u2014 Stage 3 ships. Schema expanded from 10 to 16 tags / 21 to 33 BIO labels. STAGE2 label IDs preserved exactly (new tags at IDs 21-32). TIGER, NAD, and BAN adapters now emit street_prefix/street/street_suffix/unit from existing structured input. New synth-po-box corpus source provides 50K PO box training examples across en-US/CA/GB/AU, fr-FR/CA, es-ES/MX/AR.",
82
+ "notes": "v4.2.0 consolidation release; current gate numbers are in `eval` and the training details are in `training.recipe`. The remainder of this note is carried over from v4.1.0 and describes that release: v4.1.0 secondary-unit coverage. Same Stage-3 33-BIO-label schema as 4.0.0 (no schema change). Adds a format-diverse synth-unit shard (USPS Pub-28 C2 designators: APT/STE/FL/… across unit-after, unit-first, bare, and venue-prefixed layouts) on top of the v0.9.3 multi-locale base. `unit` recognition 0%→92.3% on a held-out real-designator eval; by 'negative space' it also raised US `street` +3.3pp and lifted `country` (US +6pp, FR +15pp) — covering the missing tag sharpened its neighbors. No regression vs 4.0.0 on any US/FR golden tag; DE native-order locality held (90.6%).",
83
83
  "format": {
84
84
  "model": "ONNX int8 dynamic (quantized from fp32)",
85
85
  "tokenizer": "SentencePiece unigram, byte_fallback=true, vocab_size=48000",
86
86
  "max_sequence_length": 128,
87
87
  "opset": 17,
88
- "fp32_size_mb": 111.8,
89
- "int8_size_mb": 28.1
88
+ "fp32_size_mb": 112.9,
89
+ "int8_size_mb": 28.6
90
90
  },
91
91
  "files": {
92
92
  "model": "model.onnx",
93
93
  "tokenizer": "tokenizer.model",
94
- "model_card": "model-card.json"
94
+ "model_card": "model-card.json",
95
+ "calibration": "calibration.json",
96
+ "calibration_per_locale": "calibration-per-locale.json"
95
97
  },
96
- "base_relpath": "/data/output-v060/checkpoints/step-100000"
97
- }
98
+ "calibration": {
99
+ "method": "isotonic-regression (PAVA) over per-span softmax confidence; OPT-IN via core/decoder createCalibrator",
100
+ "held_out_ece_raw": 0.0673,
101
+ "held_out_ece_calibrated": 0.0035,
102
+ "note": "calibration.json is the global table; calibration-per-locale.json carries per-locale tables (the global table under-serves DE/NL). Apply via @mailwoman/core/decoder's createCalibrator; default parse output is byte-stable when omitted."
103
+ },
104
+ "base_relpath": "/data/output-v097-unit-v3-s42/checkpoints/step-020000",
105
+ "eval": {
106
+ "ship_gate_2026_06_10": {
107
+ "honest_eval_vt": {
108
+ "n": 1428,
109
+ "region_match_pct": 99.9,
110
+ "coord_p50_km": 3.4,
111
+ "coord_p90_km": 7.4,
112
+ "pip_coverage_adj_pct": 47.1,
113
+ "baseline_v410_region_pct": 100.0,
114
+ "verdict": "PASS"
115
+ },
116
+ "demo_presets": "PASS — 5/6 identical to v4.1.0; 6th is the intended affix split",
117
+ "int8_vs_fp32": "PASS — all gate tags within 0.1pp; quant deterministic",
118
+ "de_native_order_int8_pct": 90.9
119
+ },
120
+ "per_component_int8_gazfed": {
121
+ "us": {
122
+ "postcode": 97.3,
123
+ "country_homograph": 89.8,
124
+ "micro": 84.8,
125
+ "locality": 72.9,
126
+ "region": 89.1,
127
+ "street": 76.2,
128
+ "street_prefix": 64.9,
129
+ "street_suffix": 48.8,
130
+ "unit": 90.6,
131
+ "house_number": 96.9
132
+ },
133
+ "fr": {
134
+ "postcode": 99.6,
135
+ "house_number": 94.6,
136
+ "region": 27.6
137
+ },
138
+ "de": {
139
+ "native_locality_anchor_on": 90.9
140
+ }
141
+ },
142
+ "known_regressions_vs_4_1_0": {
143
+ "us_street": -2.3,
144
+ "unit": -1.7,
145
+ "us_postcode": -1.0,
146
+ "mitigations": "arbitration layer #478; architecture escalation #492"
147
+ }
148
+ },
149
+ "files_md5": {
150
+ "model.onnx": "9eb4a99f6db06cccff57939f657c09f9",
151
+ "tokenizer.model": "b6137e8c52914c9715374268ecaa4bc6"
152
+ }
153
+ }
package/model.onnx CHANGED
Binary file
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@mailwoman/neural-weights-en-us",
3
- "version": "4.0.0",
3
+ "version": "4.2.0",
4
4
  "description": "Mailwoman neural-classifier weights for locale 'en-us'. Data-only package — loaded by @mailwoman/neural at runtime.",
5
5
  "license": "AGPL-3.0-only",
6
6
  "repository": {
@@ -11,6 +11,8 @@
11
11
  "model.onnx",
12
12
  "tokenizer.model",
13
13
  "model-card.json",
14
+ "calibration.json",
15
+ "calibration-per-locale.json",
14
16
  "README.md"
15
17
  ],
16
18
  "publishConfig": {