npm - @mailwoman/neural-weights-fr-fr - Versions diffs - 2.0.0 → 2.2.0 - Mend

@mailwoman/neural-weights-fr-fr 2.0.0 → 2.2.0

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (5)

package/README.md CHANGED

@@ -1,30 +1,33 @@
 # @mailwoman/neural-weights-fr-fr
-Phase 2 / Stage 1 (coarse) Mailwoman neural-classifier weights.
+Stage 2 (coarse + venue/street/house_number) Mailwoman neural-classifier weights.
 - locale: **fr-fr**
-- corpus: **0.2.0**
-- training steps: **50000**
+- corpus: **0.3.0**
+- training steps: **2200**
 - hardware: **AMD Radeon 780M (gfx1103) bf16 ~14.6 GiB GTT**
-## Phase 2 §6 status
+## Per-component F1 targets
-**⚠ Below Phase 2 §6 targets (≥95% F1):**
+**⚠ Below per-component F1 targets:**
-- `country` F1 = **0.0000** (target ≥0.95)
-- `region` F1 = **0.8293** (target ≥0.95)
-- `locality` F1 = **0.6471** (target ≥0.95)
-- `postcode` F1 = **0.8594** (target ≥0.95)
+- `country` F1 = **0.2112** (target ≥0.95)
+- `region` F1 = **0.1883** (target ≥0.95)
+- `locality` F1 = **0.2736** (target ≥0.95)
+- `postcode` F1 = **0.6916** (target ≥0.95)
+- `venue` F1 = **0.3886** (target ≥0.60)
+- `street` F1 = **0.3016** (target ≥0.70)
+- `house_number` F1 = **0.7866** (target ≥0.80)
 ## Eval (golden set)
-- entries: **74**
-- full-parse exact match: **0.5270**
-- mean token confidence: **0.9745**
+- entries: **4535**
+- full-parse exact match: **0.0818**
+- mean token confidence: **0.8063**
 ## Components supported
-Stage 1 ships coarse-only: country / region / locality / dependent_locality / postcode / subregion / cedex. Street- and venue-level components are explicit future phases.
+Stage 2 ships coarse (country / region / locality / dependent_locality / postcode / subregion / cedex) plus fine-grained venue / street / house_number. Token classifier emits 21 BIO labels.
 ## Files

package/model-card.json CHANGED

@@ -1,53 +1,87 @@
 {
 	"name": "neural-weights-fr-fr",
-	"version": "0.2.0",
-	"phase": "Stage 1 (coarse)",
+	"version": "0.4.0",
+	"phase": "Stage 2 (coarse + venue/street/house_number)",
 	"license": "AGPL-3.0-only",
 	"locale": "fr-fr",
 	"training": {
-		"corpus_version": "0.2.0",
+		"corpus_version": "0.3.0",
 		"tokenizer_version": "0.1.0",
-		"steps": 50000,
+		"steps": 2200,
 		"hardware": "AMD Radeon 780M (gfx1103) bf16 ~14.6 GiB GTT",
-		"duration_seconds": 23520.0,
+		"duration_seconds": 1146.0,
 		"started_at": null,
-		"completed_at": "2026-05-18T21:33:27.380730Z"
+		"completed_at": "2026-05-23T06:21:51.190078Z"
 	},
-	"components_supported": ["country", "region", "locality", "dependent_locality", "postcode", "subregion", "cedex"],
+	"components_supported": [
+		"country",
+		"region",
+		"locality",
+		"dependent_locality",
+		"postcode",
+		"subregion",
+		"cedex",
+		"venue",
+		"street",
+		"house_number"
+	],
+	"labels": [
+		"O",
+		"B-country",
+		"I-country",
+		"B-region",
+		"I-region",
+		"B-locality",
+		"I-locality",
+		"B-dependent_locality",
+		"I-dependent_locality",
+		"B-postcode",
+		"I-postcode",
+		"B-subregion",
+		"I-subregion",
+		"B-cedex",
+		"I-cedex",
+		"B-venue",
+		"I-venue",
+		"B-street",
+		"I-street",
+		"B-house_number",
+		"I-house_number"
+	],
 	"eval": {
-		"n_entries": 74,
-		"full_parse_exact_match": 0.527027027027027,
-		"mean_token_confidence": 0.974534777700901,
+		"n_entries": 4535,
+		"full_parse_exact_match": 0.08180815876515987,
+		"mean_token_confidence": 0.8062812768727202,
 		"per_component": {
 			"country": {
-				"precision": 0.0,
-				"recall": 0.0,
-				"f1": 0.0,
-				"support": 6
+				"precision": 0.21428571428481394,
+				"recall": 0.20816326530527282,
+				"f1": 0.21118012372283307,
+				"support": 245
 			},
 			"region": {
-				"precision": 0.8499999999858334,
-				"recall": 0.80952380951096,
-				"f1": 0.8292682921697403,
-				"support": 63
+				"precision": 0.342951360263526,
+				"recall": 0.129797191887635,
+				"f1": 0.18832050661831204,
+				"support": 3205
 			},
 			"locality": {
-				"precision": 0.6874999999892578,
-				"recall": 0.6111111111026234,
-				"f1": 0.6470588230216262,
-				"support": 72
+				"precision": 0.24782398452605223,
+				"recall": 0.30533214179317686,
+				"f1": 0.2735886822759171,
+				"support": 3357
 			},
 			"dependent_locality": {
-				"precision": 0.0,
-				"recall": 0.0,
-				"f1": 0.0,
-				"support": 1
+				"precision": 0.005044136191670815,
+				"recall": 0.0999999999975,
+				"f1": 0.009603841445164863,
+				"support": 40
 			},
 			"postcode": {
-				"precision": 0.8730158730020157,
-				"recall": 0.8461538461408283,
-				"f1": 0.8593749994866943,
-				"support": 65
+				"precision": 0.8323890462696731,
+				"recall": 0.591610738254835,
+				"f1": 0.6916437813892687,
+				"support": 2980
 			},
 			"subregion": {
 				"precision": 0.0,
@@ -60,6 +94,24 @@
 				"recall": 0.0,
 				"f1": 0.0,
 				"support": 1
+			},
+			"venue": {
+				"precision": 0.37649063032335905,
+				"recall": 0.4014532243411431,
+				"f1": 0.38857142807160183,
+				"support": 1101
+			},
+			"street": {
+				"precision": 0.35594795539016916,
+				"recall": 0.26161202185783416,
+				"f1": 0.3015748026611547,
+				"support": 2928
+			},
+			"house_number": {
+				"precision": 0.7446153846150028,
+				"recall": 0.8335246842704744,
+				"f1": 0.7865655466300883,
+				"support": 1742
 			}
 		},
 		"calibration": [
@@ -72,56 +124,56 @@
 			{
 				"low": 0.1,
 				"high": 0.2,
-				"n": 0,
-				"acc": 0.0
+				"n": 21,
+				"acc": 0.23809523809523808
 			},
 			{
 				"low": 0.2,
 				"high": 0.3,
-				"n": 0,
-				"acc": 0.0
+				"n": 666,
+				"acc": 0.2912912912912913
 			},
 			{
 				"low": 0.3,
 				"high": 0.4,
-				"n": 5,
-				"acc": 0.2
+				"n": 2416,
+				"acc": 0.3265728476821192
 			},
 			{
 				"low": 0.4,
 				"high": 0.5,
-				"n": 9,
-				"acc": 0.4444444444444444
+				"n": 4308,
+				"acc": 0.3152274837511606
 			},
 			{
 				"low": 0.5,
 				"high": 0.6,
-				"n": 20,
-				"acc": 0.4
+				"n": 4777,
+				"acc": 0.3382876282185472
 			},
 			{
 				"low": 0.6,
 				"high": 0.7,
-				"n": 8,
-				"acc": 0.5
+				"n": 4943,
+				"acc": 0.3568682986040866
 			},
 			{
 				"low": 0.7,
 				"high": 0.8,
-				"n": 19,
-				"acc": 0.3684210526315789
+				"n": 5534,
+				"acc": 0.382544271774485
 			},
 			{
 				"low": 0.8,
 				"high": 0.9,
-				"n": 25,
-				"acc": 0.4
+				"n": 8066,
+				"acc": 0.43627572526655095
 			},
 			{
 				"low": 0.9,
 				"high": 1.0,
-				"n": 1114,
-				"acc": 0.8824057450628366
+				"n": 30517,
+				"acc": 0.6440344725890488
 			}
 		]
 	},
@@ -130,7 +182,7 @@
 		"particle-honorific kryptonite (e.g. FR 'Saint-Just-Saint-Rambert') if not in synth set",
 		"non-Latin scripts (CJK, Cyrillic) fall through to byte-fallback tokens; F1 unknown"
 	],
-	"notes": "Stage 1 coarse v0.2.0 \u2014 same architecture as v0.1.0 (8.87M params, 6L/256H/4-heads), trained on the expanded corpus-v0.2.0 (262.7M aligned rows, 6 train sources) with the loader rewrite from issue #43 (source-weighted multinomial sampler + relaxed coarse filter). The v0.1.0 positional-heuristic overfit was driven by a strict country-tag gate that dropped ~94% of v0.2.0 before any source weighting; with the gate relaxed and the loader interleaving sources at the row level, the model now sees a fixed mix of ban/tiger/nppes/state-tx/wof-admin/wof-postalcode per batch instead of mono-source blocks. See evals/scores-by-version.json for the v0.1.0 \u2192 v0.2.0 deltas.",
+	"notes": "v0.4.0 \u2014 issue #116. Same encoder geometry as v0.3.0 (8.87M params, 6L/256H/4-heads, 21 BIO labels, linear-chain CRF). Issue proposed (1) per-token CRF NLL normalization + (3) class-weighted CE biased toward coarse labels + (4) source-weight rebalance. Empirical iteration found that \u00a71 and \u00a73 destabilize sustained training at every LR tested (5e-4, 3e-4, 1.5e-4 \u2014 even the v0.3.0-safe LR), and on the golden v0.1.2 eval (4535 entries) they slightly REGRESS country/postcode F1 vs v0.3.0. SHIPPED recipe is the \u00a74-only ablation (v0.3.0 dual-loss + v0.4.0 source-weight rebalance) at lr=1.5e-4, step 2200. Modest fine-label gains (street +0.03, house_number +0.01), modest coarse-F1 regression (country -0.07, postcode -0.07). \u00a71/\u00a73 deferred to v0.4.1 corpus-side investigation per issue's '2K divergence' clause. Full ablation matrix retrospective in LOG.md.",
 	"format": {
 		"model": "ONNX int8 dynamic",
 		"tokenizer": "SentencePiece unigram, byte_fallback=true, vocab_size=16000",
@@ -142,5 +194,5 @@
 		"tokenizer": "tokenizer.model",
 		"model_card": "model-card.json"
 	},
-	"base_relpath": "/data/models/checkpoints/stage1-coarse/step-050000"
+	"base_relpath": "/data/models/checkpoints/v0_4_0-stableLR-source-only/step-002200"
 }

package/model.onnx CHANGED

Binary file

package/package.json CHANGED

@@ -1,19 +1,19 @@
 {
- "name": "@mailwoman/neural-weights-fr-fr",
- "version": "2.0.0",
- "description": "Mailwoman neural-classifier weights for locale 'fr-fr'. Data-only package — loaded by @mailwoman/neural at runtime.",
- "license": "AGPL-3.0-only",
- "repository": {
-  "type": "git",
-  "url": "https://github.com/sister-software/mailwoman"
- },
- "files": [
-  "model.onnx",
-  "tokenizer.model",
-  "model-card.json",
-  "README.md"
- ],
- "publishConfig": {
-  "access": "public"
- }
-}
+  "name": "@mailwoman/neural-weights-fr-fr",
+  "version": "2.2.0",
+  "description": "Mailwoman neural-classifier weights for locale 'fr-fr'. Data-only package — loaded by @mailwoman/neural at runtime.",
+  "license": "AGPL-3.0-only",
+  "repository": {
+    "type": "git",
+    "url": "https://github.com/sister-software/mailwoman"
+  },
+  "files": [
+    "model.onnx",
+    "tokenizer.model",
+    "model-card.json",
+    "README.md"
+  ],
+  "publishConfig": {
+    "access": "public"
+  }
+}

package/tokenizer.model CHANGED

Binary file