@mailwoman/core 2.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/data/chromium-i18n/ssl-address/AC.json +8 -0
- package/data/chromium-i18n/ssl-address/AD.json +16 -0
- package/data/chromium-i18n/ssl-address/AE.json +15 -0
- package/data/chromium-i18n/ssl-address/AF.json +8 -0
- package/data/chromium-i18n/ssl-address/AG.json +1 -0
- package/data/chromium-i18n/ssl-address/AI.json +8 -0
- package/data/chromium-i18n/ssl-address/AL.json +8 -0
- package/data/chromium-i18n/ssl-address/AM.json +16 -0
- package/data/chromium-i18n/ssl-address/AO.json +1 -0
- package/data/chromium-i18n/ssl-address/AQ.json +1 -0
- package/data/chromium-i18n/ssl-address/AR.json +16 -0
- package/data/chromium-i18n/ssl-address/AS.json +13 -0
- package/data/chromium-i18n/ssl-address/AT.json +10 -0
- package/data/chromium-i18n/ssl-address/AU.json +20 -0
- package/data/chromium-i18n/ssl-address/AW.json +1 -0
- package/data/chromium-i18n/ssl-address/AX.json +11 -0
- package/data/chromium-i18n/ssl-address/AZ.json +9 -0
- package/data/chromium-i18n/ssl-address/BA.json +8 -0
- package/data/chromium-i18n/ssl-address/BB.json +9 -0
- package/data/chromium-i18n/ssl-address/BD.json +9 -0
- package/data/chromium-i18n/ssl-address/BE.json +10 -0
- package/data/chromium-i18n/ssl-address/BF.json +6 -0
- package/data/chromium-i18n/ssl-address/BG.json +9 -0
- package/data/chromium-i18n/ssl-address/BH.json +8 -0
- package/data/chromium-i18n/ssl-address/BI.json +1 -0
- package/data/chromium-i18n/ssl-address/BJ.json +1 -0
- package/data/chromium-i18n/ssl-address/BL.json +11 -0
- package/data/chromium-i18n/ssl-address/BM.json +9 -0
- package/data/chromium-i18n/ssl-address/BN.json +9 -0
- package/data/chromium-i18n/ssl-address/BO.json +1 -0
- package/data/chromium-i18n/ssl-address/BQ.json +1 -0
- package/data/chromium-i18n/ssl-address/BR.json +21 -0
- package/data/chromium-i18n/ssl-address/BS.json +12 -0
- package/data/chromium-i18n/ssl-address/BT.json +9 -0
- package/data/chromium-i18n/ssl-address/BV.json +1 -0
- package/data/chromium-i18n/ssl-address/BW.json +1 -0
- package/data/chromium-i18n/ssl-address/BY.json +9 -0
- package/data/chromium-i18n/ssl-address/BZ.json +1 -0
- package/data/chromium-i18n/ssl-address/CA.json +17 -0
- package/data/chromium-i18n/ssl-address/CC.json +9 -0
- package/data/chromium-i18n/ssl-address/CD.json +1 -0
- package/data/chromium-i18n/ssl-address/CF.json +1 -0
- package/data/chromium-i18n/ssl-address/CG.json +1 -0
- package/data/chromium-i18n/ssl-address/CH.json +12 -0
- package/data/chromium-i18n/ssl-address/CI.json +6 -0
- package/data/chromium-i18n/ssl-address/CK.json +1 -0
- package/data/chromium-i18n/ssl-address/CL.json +15 -0
- package/data/chromium-i18n/ssl-address/CM.json +1 -0
- package/data/chromium-i18n/ssl-address/CN.json +22 -0
- package/data/chromium-i18n/ssl-address/CO.json +11 -0
- package/data/chromium-i18n/ssl-address/CR.json +10 -0
- package/data/chromium-i18n/ssl-address/CU.json +12 -0
- package/data/chromium-i18n/ssl-address/CV.json +13 -0
- package/data/chromium-i18n/ssl-address/CW.json +1 -0
- package/data/chromium-i18n/ssl-address/CX.json +9 -0
- package/data/chromium-i18n/ssl-address/CY.json +8 -0
- package/data/chromium-i18n/ssl-address/CZ.json +10 -0
- package/data/chromium-i18n/ssl-address/DE.json +10 -0
- package/data/chromium-i18n/ssl-address/DJ.json +1 -0
- package/data/chromium-i18n/ssl-address/DK.json +10 -0
- package/data/chromium-i18n/ssl-address/DM.json +1 -0
- package/data/chromium-i18n/ssl-address/DO.json +9 -0
- package/data/chromium-i18n/ssl-address/DZ.json +8 -0
- package/data/chromium-i18n/ssl-address/EC.json +10 -0
- package/data/chromium-i18n/ssl-address/EE.json +9 -0
- package/data/chromium-i18n/ssl-address/EG.json +16 -0
- package/data/chromium-i18n/ssl-address/EH.json +8 -0
- package/data/chromium-i18n/ssl-address/ER.json +1 -0
- package/data/chromium-i18n/ssl-address/ES.json +16 -0
- package/data/chromium-i18n/ssl-address/ET.json +8 -0
- package/data/chromium-i18n/ssl-address/FI.json +11 -0
- package/data/chromium-i18n/ssl-address/FJ.json +1 -0
- package/data/chromium-i18n/ssl-address/FK.json +10 -0
- package/data/chromium-i18n/ssl-address/FM.json +13 -0
- package/data/chromium-i18n/ssl-address/FO.json +10 -0
- package/data/chromium-i18n/ssl-address/FR.json +11 -0
- package/data/chromium-i18n/ssl-address/GA.json +1 -0
- package/data/chromium-i18n/ssl-address/GB.json +12 -0
- package/data/chromium-i18n/ssl-address/GD.json +1 -0
- package/data/chromium-i18n/ssl-address/GE.json +9 -0
- package/data/chromium-i18n/ssl-address/GF.json +11 -0
- package/data/chromium-i18n/ssl-address/GG.json +11 -0
- package/data/chromium-i18n/ssl-address/GH.json +1 -0
- package/data/chromium-i18n/ssl-address/GI.json +9 -0
- package/data/chromium-i18n/ssl-address/GL.json +9 -0
- package/data/chromium-i18n/ssl-address/GM.json +1 -0
- package/data/chromium-i18n/ssl-address/GN.json +8 -0
- package/data/chromium-i18n/ssl-address/GP.json +11 -0
- package/data/chromium-i18n/ssl-address/GQ.json +1 -0
- package/data/chromium-i18n/ssl-address/GR.json +10 -0
- package/data/chromium-i18n/ssl-address/GS.json +10 -0
- package/data/chromium-i18n/ssl-address/GT.json +8 -0
- package/data/chromium-i18n/ssl-address/GU.json +12 -0
- package/data/chromium-i18n/ssl-address/GW.json +8 -0
- package/data/chromium-i18n/ssl-address/GY.json +1 -0
- package/data/chromium-i18n/ssl-address/HK.json +16 -0
- package/data/chromium-i18n/ssl-address/HM.json +9 -0
- package/data/chromium-i18n/ssl-address/HN.json +9 -0
- package/data/chromium-i18n/ssl-address/HR.json +10 -0
- package/data/chromium-i18n/ssl-address/HT.json +9 -0
- package/data/chromium-i18n/ssl-address/HU.json +11 -0
- package/data/chromium-i18n/ssl-address/ID.json +13 -0
- package/data/chromium-i18n/ssl-address/IE.json +16 -0
- package/data/chromium-i18n/ssl-address/IL.json +9 -0
- package/data/chromium-i18n/ssl-address/IM.json +11 -0
- package/data/chromium-i18n/ssl-address/IN.json +18 -0
- package/data/chromium-i18n/ssl-address/IO.json +10 -0
- package/data/chromium-i18n/ssl-address/IQ.json +10 -0
- package/data/chromium-i18n/ssl-address/IR.json +14 -0
- package/data/chromium-i18n/ssl-address/IS.json +9 -0
- package/data/chromium-i18n/ssl-address/IT.json +17 -0
- package/data/chromium-i18n/ssl-address/JE.json +11 -0
- package/data/chromium-i18n/ssl-address/JM.json +12 -0
- package/data/chromium-i18n/ssl-address/JO.json +8 -0
- package/data/chromium-i18n/ssl-address/JP.json +19 -0
- package/data/chromium-i18n/ssl-address/KE.json +8 -0
- package/data/chromium-i18n/ssl-address/KG.json +8 -0
- package/data/chromium-i18n/ssl-address/KH.json +8 -0
- package/data/chromium-i18n/ssl-address/KI.json +8 -0
- package/data/chromium-i18n/ssl-address/KM.json +1 -0
- package/data/chromium-i18n/ssl-address/KN.json +12 -0
- package/data/chromium-i18n/ssl-address/KP.json +12 -0
- package/data/chromium-i18n/ssl-address/KR.json +23 -0
- package/data/chromium-i18n/ssl-address/KW.json +8 -0
- package/data/chromium-i18n/ssl-address/KY.json +14 -0
- package/data/chromium-i18n/ssl-address/KZ.json +8 -0
- package/data/chromium-i18n/ssl-address/LA.json +8 -0
- package/data/chromium-i18n/ssl-address/LB.json +8 -0
- package/data/chromium-i18n/ssl-address/LC.json +1 -0
- package/data/chromium-i18n/ssl-address/LI.json +11 -0
- package/data/chromium-i18n/ssl-address/LK.json +9 -0
- package/data/chromium-i18n/ssl-address/LR.json +8 -0
- package/data/chromium-i18n/ssl-address/LS.json +8 -0
- package/data/chromium-i18n/ssl-address/LT.json +10 -0
- package/data/chromium-i18n/ssl-address/LU.json +11 -0
- package/data/chromium-i18n/ssl-address/LV.json +9 -0
- package/data/chromium-i18n/ssl-address/LY.json +1 -0
- package/data/chromium-i18n/ssl-address/MA.json +8 -0
- package/data/chromium-i18n/ssl-address/MC.json +9 -0
- package/data/chromium-i18n/ssl-address/MD.json +9 -0
- package/data/chromium-i18n/ssl-address/ME.json +8 -0
- package/data/chromium-i18n/ssl-address/MF.json +11 -0
- package/data/chromium-i18n/ssl-address/MG.json +8 -0
- package/data/chromium-i18n/ssl-address/MH.json +13 -0
- package/data/chromium-i18n/ssl-address/MK.json +8 -0
- package/data/chromium-i18n/ssl-address/ML.json +1 -0
- package/data/chromium-i18n/ssl-address/MM.json +8 -0
- package/data/chromium-i18n/ssl-address/MN.json +9 -0
- package/data/chromium-i18n/ssl-address/MO.json +8 -0
- package/data/chromium-i18n/ssl-address/MP.json +13 -0
- package/data/chromium-i18n/ssl-address/MQ.json +11 -0
- package/data/chromium-i18n/ssl-address/MR.json +1 -0
- package/data/chromium-i18n/ssl-address/MS.json +1 -0
- package/data/chromium-i18n/ssl-address/MT.json +10 -0
- package/data/chromium-i18n/ssl-address/MU.json +9 -0
- package/data/chromium-i18n/ssl-address/MV.json +9 -0
- package/data/chromium-i18n/ssl-address/MW.json +1 -0
- package/data/chromium-i18n/ssl-address/MX.json +20 -0
- package/data/chromium-i18n/ssl-address/MY.json +19 -0
- package/data/chromium-i18n/ssl-address/MZ.json +12 -0
- package/data/chromium-i18n/ssl-address/NA.json +1 -0
- package/data/chromium-i18n/ssl-address/NC.json +11 -0
- package/data/chromium-i18n/ssl-address/NE.json +8 -0
- package/data/chromium-i18n/ssl-address/NF.json +9 -0
- package/data/chromium-i18n/ssl-address/NG.json +15 -0
- package/data/chromium-i18n/ssl-address/NI.json +16 -0
- package/data/chromium-i18n/ssl-address/NL.json +10 -0
- package/data/chromium-i18n/ssl-address/NO.json +11 -0
- package/data/chromium-i18n/ssl-address/NP.json +9 -0
- package/data/chromium-i18n/ssl-address/NR.json +12 -0
- package/data/chromium-i18n/ssl-address/NU.json +1 -0
- package/data/chromium-i18n/ssl-address/NZ.json +10 -0
- package/data/chromium-i18n/ssl-address/OM.json +8 -0
- package/data/chromium-i18n/ssl-address/PA.json +7 -0
- package/data/chromium-i18n/ssl-address/PE.json +14 -0
- package/data/chromium-i18n/ssl-address/PF.json +11 -0
- package/data/chromium-i18n/ssl-address/PG.json +9 -0
- package/data/chromium-i18n/ssl-address/PH.json +15 -0
- package/data/chromium-i18n/ssl-address/PK.json +9 -0
- package/data/chromium-i18n/ssl-address/PL.json +10 -0
- package/data/chromium-i18n/ssl-address/PM.json +10 -0
- package/data/chromium-i18n/ssl-address/PN.json +10 -0
- package/data/chromium-i18n/ssl-address/PR.json +13 -0
- package/data/chromium-i18n/ssl-address/PS.json +1 -0
- package/data/chromium-i18n/ssl-address/PT.json +10 -0
- package/data/chromium-i18n/ssl-address/PW.json +13 -0
- package/data/chromium-i18n/ssl-address/PY.json +8 -0
- package/data/chromium-i18n/ssl-address/QA.json +1 -0
- package/data/chromium-i18n/ssl-address/RE.json +11 -0
- package/data/chromium-i18n/ssl-address/RO.json +10 -0
- package/data/chromium-i18n/ssl-address/RS.json +9 -0
- package/data/chromium-i18n/ssl-address/RU.json +20 -0
- package/data/chromium-i18n/ssl-address/RW.json +1 -0
- package/data/chromium-i18n/ssl-address/SA.json +8 -0
- package/data/chromium-i18n/ssl-address/SB.json +1 -0
- package/data/chromium-i18n/ssl-address/SC.json +8 -0
- package/data/chromium-i18n/ssl-address/SD.json +9 -0
- package/data/chromium-i18n/ssl-address/SE.json +12 -0
- package/data/chromium-i18n/ssl-address/SG.json +10 -0
- package/data/chromium-i18n/ssl-address/SH.json +10 -0
- package/data/chromium-i18n/ssl-address/SI.json +9 -0
- package/data/chromium-i18n/ssl-address/SJ.json +11 -0
- package/data/chromium-i18n/ssl-address/SK.json +10 -0
- package/data/chromium-i18n/ssl-address/SL.json +1 -0
- package/data/chromium-i18n/ssl-address/SM.json +10 -0
- package/data/chromium-i18n/ssl-address/SN.json +8 -0
- package/data/chromium-i18n/ssl-address/SO.json +15 -0
- package/data/chromium-i18n/ssl-address/SR.json +11 -0
- package/data/chromium-i18n/ssl-address/SS.json +1 -0
- package/data/chromium-i18n/ssl-address/ST.json +1 -0
- package/data/chromium-i18n/ssl-address/SV.json +17 -0
- package/data/chromium-i18n/ssl-address/SX.json +1 -0
- package/data/chromium-i18n/ssl-address/SY.json +6 -0
- package/data/chromium-i18n/ssl-address/SZ.json +10 -0
- package/data/chromium-i18n/ssl-address/TA.json +8 -0
- package/data/chromium-i18n/ssl-address/TC.json +10 -0
- package/data/chromium-i18n/ssl-address/TD.json +1 -0
- package/data/chromium-i18n/ssl-address/TF.json +1 -0
- package/data/chromium-i18n/ssl-address/TG.json +1 -0
- package/data/chromium-i18n/ssl-address/TH.json +16 -0
- package/data/chromium-i18n/ssl-address/TJ.json +8 -0
- package/data/chromium-i18n/ssl-address/TK.json +1 -0
- package/data/chromium-i18n/ssl-address/TL.json +1 -0
- package/data/chromium-i18n/ssl-address/TM.json +8 -0
- package/data/chromium-i18n/ssl-address/TN.json +9 -0
- package/data/chromium-i18n/ssl-address/TO.json +1 -0
- package/data/chromium-i18n/ssl-address/TR.json +16 -0
- package/data/chromium-i18n/ssl-address/TT.json +1 -0
- package/data/chromium-i18n/ssl-address/TV.json +12 -0
- package/data/chromium-i18n/ssl-address/TW.json +20 -0
- package/data/chromium-i18n/ssl-address/TZ.json +8 -0
- package/data/chromium-i18n/ssl-address/UA.json +19 -0
- package/data/chromium-i18n/ssl-address/UG.json +1 -0
- package/data/chromium-i18n/ssl-address/UM.json +13 -0
- package/data/chromium-i18n/ssl-address/US.json +20 -0
- package/data/chromium-i18n/ssl-address/UY.json +15 -0
- package/data/chromium-i18n/ssl-address/UZ.json +10 -0
- package/data/chromium-i18n/ssl-address/VA.json +8 -0
- package/data/chromium-i18n/ssl-address/VC.json +9 -0
- package/data/chromium-i18n/ssl-address/VE.json +16 -0
- package/data/chromium-i18n/ssl-address/VG.json +9 -0
- package/data/chromium-i18n/ssl-address/VI.json +13 -0
- package/data/chromium-i18n/ssl-address/VN.json +15 -0
- package/data/chromium-i18n/ssl-address/VU.json +1 -0
- package/data/chromium-i18n/ssl-address/WF.json +10 -0
- package/data/chromium-i18n/ssl-address/WS.json +1 -0
- package/data/chromium-i18n/ssl-address/XK.json +8 -0
- package/data/chromium-i18n/ssl-address/YE.json +1 -0
- package/data/chromium-i18n/ssl-address/YT.json +10 -0
- package/data/chromium-i18n/ssl-address/ZA.json +10 -0
- package/data/chromium-i18n/ssl-address/ZM.json +8 -0
- package/data/chromium-i18n/ssl-address/ZW.json +1 -0
- package/data/chromium-i18n/ssl-address-download.sh +15 -0
- package/data/internal/dictionaries/languages.csv +184 -0
- package/data/internal/dictionaries/libpostal/af/personal_titles.txt +2 -0
- package/data/internal/dictionaries/libpostal/all/surnames.txt +1 -0
- package/data/internal/dictionaries/libpostal/de/academic_degrees.txt +7 -0
- package/data/internal/dictionaries/libpostal/de/concatenated_suffixes_separable.txt +3 -0
- package/data/internal/dictionaries/libpostal/de/near.txt +2 -0
- package/data/internal/dictionaries/libpostal/de/place_names.txt +11 -0
- package/data/internal/dictionaries/libpostal/de/stopwords.txt +1 -0
- package/data/internal/dictionaries/libpostal/de/street_types.txt +2 -0
- package/data/internal/dictionaries/libpostal/en/place_names.txt +7 -0
- package/data/internal/dictionaries/libpostal/en/road_types.txt +18 -0
- package/data/internal/dictionaries/libpostal/en/street_names.txt +2 -0
- package/data/internal/dictionaries/libpostal/en/street_types.txt +16 -0
- package/data/internal/dictionaries/libpostal/en/unit_types_numbered.txt +3 -0
- package/data/internal/dictionaries/libpostal/es/street_types.txt +2 -0
- package/data/internal/dictionaries/libpostal/fr/personal_titles.txt +4 -0
- package/data/internal/dictionaries/libpostal/fr/stopwords.txt +2 -0
- package/data/internal/dictionaries/libpostal/fr/street_types.txt +5 -0
- package/data/internal/dictionaries/libpostal/it/street_types.txt +2 -0
- package/data/internal/dictionaries/libpostal/ko/street_types.txt +1 -0
- package/data/internal/dictionaries/libpostal/nb/concatenated_suffixes_inseparable.txt +40 -0
- package/data/internal/dictionaries/libpostal/nb/directionals.txt +8 -0
- package/data/internal/dictionaries/libpostal/nb/street_types.txt +36 -0
- package/data/internal/dictionaries/libpostal/nl/concatenated_suffixes_inseparable.txt +1 -0
- package/data/internal/dictionaries/libpostal/nl/concatenated_suffixes_separable.txt +8 -0
- package/data/internal/dictionaries/libpostal/nl/directionals.txt +4 -0
- package/data/internal/dictionaries/libpostal/nl/personal_suffixes.txt +4 -0
- package/data/internal/dictionaries/libpostal/nl/personal_titles.txt +43 -0
- package/data/internal/dictionaries/libpostal/pl/place_names.txt +1 -0
- package/data/internal/dictionaries/libpostal/pl/synonyms.txt +1 -0
- package/data/internal/dictionaries/libpostal/sv/concatenated_suffixes_separable.txt +1 -0
- package/data/internal/dictionaries/whosonfirst/locality/name:eng_x_preferred.txt +81 -0
- package/data/internal/dictionaries/whosonfirst/locality/name:fra_x_preferred.txt +2 -0
- package/data/internal/dictionaries/whosonfirst/region/name:eng_x_preferred.txt +2 -0
- package/data/libpostal/dictionaries/README.md +88 -0
- package/data/libpostal/dictionaries/af/ambiguous_expansions.txt +8 -0
- package/data/libpostal/dictionaries/af/concatenated_suffixes_inseparable.txt +1 -0
- package/data/libpostal/dictionaries/af/concatenated_suffixes_separable.txt +14 -0
- package/data/libpostal/dictionaries/af/directionals.txt +12 -0
- package/data/libpostal/dictionaries/af/personal_titles.txt +23 -0
- package/data/libpostal/dictionaries/af/place_names.txt +2 -0
- package/data/libpostal/dictionaries/af/qualifiers.txt +4 -0
- package/data/libpostal/dictionaries/af/stopwords.txt +38 -0
- package/data/libpostal/dictionaries/af/street_types.txt +21 -0
- package/data/libpostal/dictionaries/all/ambiguous_expansions.txt +1 -0
- package/data/libpostal/dictionaries/all/chains.txt +504 -0
- package/data/libpostal/dictionaries/all/given_names.txt +12715 -0
- package/data/libpostal/dictionaries/all/people.txt +5 -0
- package/data/libpostal/dictionaries/all/surnames.txt +49375 -0
- package/data/libpostal/dictionaries/ar/personal_titles.txt +4 -0
- package/data/libpostal/dictionaries/ar/place_names.txt +1 -0
- package/data/libpostal/dictionaries/ar/street_types.txt +11 -0
- package/data/libpostal/dictionaries/ast/ambiguous_expansions.txt +1 -0
- package/data/libpostal/dictionaries/ast/personal_titles.txt +1 -0
- package/data/libpostal/dictionaries/ast/street_types.txt +3 -0
- package/data/libpostal/dictionaries/az/building_types.txt +1 -0
- package/data/libpostal/dictionaries/az/directionals.txt +8 -0
- package/data/libpostal/dictionaries/az/personal_titles.txt +3 -0
- package/data/libpostal/dictionaries/az/place_names.txt +1 -0
- package/data/libpostal/dictionaries/az/street_types.txt +18 -0
- package/data/libpostal/dictionaries/be/ambiguous_expansions.txt +8 -0
- package/data/libpostal/dictionaries/be/building_types.txt +2 -0
- package/data/libpostal/dictionaries/be/chains.txt +8 -0
- package/data/libpostal/dictionaries/be/directionals.txt +25 -0
- package/data/libpostal/dictionaries/be/house_numbers.txt +2 -0
- package/data/libpostal/dictionaries/be/personal_titles.txt +6 -0
- package/data/libpostal/dictionaries/be/qualifiers.txt +20 -0
- package/data/libpostal/dictionaries/be/street_types.txt +28 -0
- package/data/libpostal/dictionaries/be/unit_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/bg/ambiguous_expansions.txt +2 -0
- package/data/libpostal/dictionaries/bg/cross_streets.txt +10 -0
- package/data/libpostal/dictionaries/bg/directionals.txt +8 -0
- package/data/libpostal/dictionaries/bg/entrances.txt +2 -0
- package/data/libpostal/dictionaries/bg/level_types_numbered.txt +6 -0
- package/data/libpostal/dictionaries/bg/level_types_standalone.txt +4 -0
- package/data/libpostal/dictionaries/bg/near.txt +20 -0
- package/data/libpostal/dictionaries/bg/number.txt +2 -0
- package/data/libpostal/dictionaries/bg/personal_titles.txt +14 -0
- package/data/libpostal/dictionaries/bg/place_names.txt +6 -0
- package/data/libpostal/dictionaries/bg/post_office.txt +2 -0
- package/data/libpostal/dictionaries/bg/qualifiers.txt +10 -0
- package/data/libpostal/dictionaries/bg/staircases.txt +2 -0
- package/data/libpostal/dictionaries/bg/street_types.txt +6 -0
- package/data/libpostal/dictionaries/bg/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/bg/unit_types_numbered.txt +6 -0
- package/data/libpostal/dictionaries/br/personal_titles.txt +3 -0
- package/data/libpostal/dictionaries/br/place_names.txt +3 -0
- package/data/libpostal/dictionaries/br/qualifiers.txt +1 -0
- package/data/libpostal/dictionaries/br/stopwords.txt +4 -0
- package/data/libpostal/dictionaries/br/street_types.txt +40 -0
- package/data/libpostal/dictionaries/bs/ambiguous_expansions.txt +5 -0
- package/data/libpostal/dictionaries/bs/building_types.txt +1 -0
- package/data/libpostal/dictionaries/bs/cross_streets.txt +6 -0
- package/data/libpostal/dictionaries/bs/directionals.txt +4 -0
- package/data/libpostal/dictionaries/bs/entrances.txt +1 -0
- package/data/libpostal/dictionaries/bs/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/bs/level_types_mezzanine.txt +1 -0
- package/data/libpostal/dictionaries/bs/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/bs/level_types_standalone.txt +2 -0
- package/data/libpostal/dictionaries/bs/near.txt +5 -0
- package/data/libpostal/dictionaries/bs/no_number.txt +1 -0
- package/data/libpostal/dictionaries/bs/number.txt +1 -0
- package/data/libpostal/dictionaries/bs/personal_titles.txt +8 -0
- package/data/libpostal/dictionaries/bs/place_names.txt +9 -0
- package/data/libpostal/dictionaries/bs/post_office.txt +1 -0
- package/data/libpostal/dictionaries/bs/qualifiers.txt +2 -0
- package/data/libpostal/dictionaries/bs/staircases.txt +1 -0
- package/data/libpostal/dictionaries/bs/stopwords.txt +2 -0
- package/data/libpostal/dictionaries/bs/street_types.txt +12 -0
- package/data/libpostal/dictionaries/bs/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/bs/unit_types_numbered.txt +4 -0
- package/data/libpostal/dictionaries/ca/ambiguous_expansions.txt +9 -0
- package/data/libpostal/dictionaries/ca/cross_streets.txt +8 -0
- package/data/libpostal/dictionaries/ca/directionals.txt +9 -0
- package/data/libpostal/dictionaries/ca/elisions.txt +1 -0
- package/data/libpostal/dictionaries/ca/entrances.txt +1 -0
- package/data/libpostal/dictionaries/ca/given_names.txt +1 -0
- package/data/libpostal/dictionaries/ca/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/ca/level_types_mezzanine.txt +1 -0
- package/data/libpostal/dictionaries/ca/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/ca/level_types_standalone.txt +5 -0
- package/data/libpostal/dictionaries/ca/level_types_sub_basement.txt +1 -0
- package/data/libpostal/dictionaries/ca/near.txt +12 -0
- package/data/libpostal/dictionaries/ca/no_number.txt +1 -0
- package/data/libpostal/dictionaries/ca/number.txt +1 -0
- package/data/libpostal/dictionaries/ca/personal_titles.txt +10 -0
- package/data/libpostal/dictionaries/ca/place_names.txt +133 -0
- package/data/libpostal/dictionaries/ca/post_office.txt +1 -0
- package/data/libpostal/dictionaries/ca/postcodes.txt +1 -0
- package/data/libpostal/dictionaries/ca/qualifiers.txt +8 -0
- package/data/libpostal/dictionaries/ca/staircases.txt +1 -0
- package/data/libpostal/dictionaries/ca/stopwords.txt +31 -0
- package/data/libpostal/dictionaries/ca/street_types.txt +28 -0
- package/data/libpostal/dictionaries/ca/synonyms.txt +14 -0
- package/data/libpostal/dictionaries/ca/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/ca/unit_types_numbered.txt +10 -0
- package/data/libpostal/dictionaries/cs/ambiguous_expansions.txt +6 -0
- package/data/libpostal/dictionaries/cs/chains.txt +1 -0
- package/data/libpostal/dictionaries/cs/cross_streets.txt +9 -0
- package/data/libpostal/dictionaries/cs/directionals.txt +4 -0
- package/data/libpostal/dictionaries/cs/entrances.txt +1 -0
- package/data/libpostal/dictionaries/cs/house_numbers.txt +1 -0
- package/data/libpostal/dictionaries/cs/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/cs/level_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/cs/level_types_standalone.txt +1 -0
- package/data/libpostal/dictionaries/cs/near.txt +12 -0
- package/data/libpostal/dictionaries/cs/number.txt +1 -0
- package/data/libpostal/dictionaries/cs/personal_titles.txt +2 -0
- package/data/libpostal/dictionaries/cs/place_names.txt +47 -0
- package/data/libpostal/dictionaries/cs/post_office.txt +1 -0
- package/data/libpostal/dictionaries/cs/staircases.txt +1 -0
- package/data/libpostal/dictionaries/cs/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/cs/street_types.txt +6 -0
- package/data/libpostal/dictionaries/cs/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/cs/unit_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/cy/building_types.txt +5 -0
- package/data/libpostal/dictionaries/cy/directionals.txt +4 -0
- package/data/libpostal/dictionaries/cy/personal_titles.txt +2 -0
- package/data/libpostal/dictionaries/cy/place_names.txt +22 -0
- package/data/libpostal/dictionaries/cy/qualifiers.txt +2 -0
- package/data/libpostal/dictionaries/cy/stopwords.txt +3 -0
- package/data/libpostal/dictionaries/cy/street_types.txt +22 -0
- package/data/libpostal/dictionaries/da/academic_degrees.txt +1 -0
- package/data/libpostal/dictionaries/da/ambiguous_expansions.txt +7 -0
- package/data/libpostal/dictionaries/da/building_types.txt +3 -0
- package/data/libpostal/dictionaries/da/concatenated_suffixes_inseparable.txt +21 -0
- package/data/libpostal/dictionaries/da/concatenated_suffixes_separable.txt +9 -0
- package/data/libpostal/dictionaries/da/cross_streets.txt +5 -0
- package/data/libpostal/dictionaries/da/directionals.txt +13 -0
- package/data/libpostal/dictionaries/da/entrances.txt +1 -0
- package/data/libpostal/dictionaries/da/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/da/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/da/level_types_standalone.txt +2 -0
- package/data/libpostal/dictionaries/da/near.txt +14 -0
- package/data/libpostal/dictionaries/da/number.txt +1 -0
- package/data/libpostal/dictionaries/da/personal_titles.txt +1 -0
- package/data/libpostal/dictionaries/da/place_names.txt +7 -0
- package/data/libpostal/dictionaries/da/post_office.txt +2 -0
- package/data/libpostal/dictionaries/da/staircases.txt +2 -0
- package/data/libpostal/dictionaries/da/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/da/street_types.txt +38 -0
- package/data/libpostal/dictionaries/da/synonyms.txt +2 -0
- package/data/libpostal/dictionaries/da/unit_directions.txt +3 -0
- package/data/libpostal/dictionaries/da/unit_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/de/academic_degrees.txt +5 -0
- package/data/libpostal/dictionaries/de/ambiguous_expansions.txt +18 -0
- package/data/libpostal/dictionaries/de/chains.txt +11 -0
- package/data/libpostal/dictionaries/de/company_types.txt +8 -0
- package/data/libpostal/dictionaries/de/concatenated_prefixes_separable.txt +17 -0
- package/data/libpostal/dictionaries/de/concatenated_suffixes_inseparable.txt +5 -0
- package/data/libpostal/dictionaries/de/concatenated_suffixes_separable.txt +16 -0
- package/data/libpostal/dictionaries/de/cross_streets.txt +5 -0
- package/data/libpostal/dictionaries/de/directionals.txt +41 -0
- package/data/libpostal/dictionaries/de/entrances.txt +1 -0
- package/data/libpostal/dictionaries/de/house_numbers.txt +1 -0
- package/data/libpostal/dictionaries/de/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/de/level_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/de/level_types_standalone.txt +4 -0
- package/data/libpostal/dictionaries/de/near.txt +16 -0
- package/data/libpostal/dictionaries/de/number.txt +1 -0
- package/data/libpostal/dictionaries/de/personal_suffixes.txt +2 -0
- package/data/libpostal/dictionaries/de/personal_titles.txt +18 -0
- package/data/libpostal/dictionaries/de/place_names.txt +123 -0
- package/data/libpostal/dictionaries/de/post_office.txt +1 -0
- package/data/libpostal/dictionaries/de/qualifiers.txt +3 -0
- package/data/libpostal/dictionaries/de/staircases.txt +2 -0
- package/data/libpostal/dictionaries/de/stopwords.txt +39 -0
- package/data/libpostal/dictionaries/de/street_types.txt +36 -0
- package/data/libpostal/dictionaries/de/synonyms.txt +16 -0
- package/data/libpostal/dictionaries/de/toponyms.txt +28 -0
- package/data/libpostal/dictionaries/de/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/de/unit_types_numbered.txt +7 -0
- package/data/libpostal/dictionaries/el/ambiguous_expansions.txt +1 -0
- package/data/libpostal/dictionaries/el/building_types.txt +2 -0
- package/data/libpostal/dictionaries/el/entrances.txt +2 -0
- package/data/libpostal/dictionaries/el/given_names.txt +6 -0
- package/data/libpostal/dictionaries/el/level_types_basement.txt +2 -0
- package/data/libpostal/dictionaries/el/level_types_mezzanine.txt +2 -0
- package/data/libpostal/dictionaries/el/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/el/level_types_standalone.txt +2 -0
- package/data/libpostal/dictionaries/el/personal_titles.txt +12 -0
- package/data/libpostal/dictionaries/el/place_names.txt +18 -0
- package/data/libpostal/dictionaries/el/post_office.txt +2 -0
- package/data/libpostal/dictionaries/el/postcodes.txt +2 -0
- package/data/libpostal/dictionaries/el/qualifiers.txt +6 -0
- package/data/libpostal/dictionaries/el/staircases.txt +2 -0
- package/data/libpostal/dictionaries/el/street_types.txt +6 -0
- package/data/libpostal/dictionaries/el/synonyms.txt +41 -0
- package/data/libpostal/dictionaries/el/toponyms.txt +3 -0
- package/data/libpostal/dictionaries/el/unit_types_numbered.txt +6 -0
- package/data/libpostal/dictionaries/en/academic_degrees.txt +27 -0
- package/data/libpostal/dictionaries/en/ambiguous_expansions.txt +178 -0
- package/data/libpostal/dictionaries/en/building_types.txt +19 -0
- package/data/libpostal/dictionaries/en/chains.txt +6 -0
- package/data/libpostal/dictionaries/en/company_types.txt +61 -0
- package/data/libpostal/dictionaries/en/cross_streets.txt +9 -0
- package/data/libpostal/dictionaries/en/directionals.txt +20 -0
- package/data/libpostal/dictionaries/en/entrances.txt +1 -0
- package/data/libpostal/dictionaries/en/given_names.txt +2 -0
- package/data/libpostal/dictionaries/en/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/en/level_types_mezzanine.txt +5 -0
- package/data/libpostal/dictionaries/en/level_types_numbered.txt +4 -0
- package/data/libpostal/dictionaries/en/level_types_standalone.txt +12 -0
- package/data/libpostal/dictionaries/en/level_types_sub_basement.txt +1 -0
- package/data/libpostal/dictionaries/en/near.txt +7 -0
- package/data/libpostal/dictionaries/en/no_number.txt +1 -0
- package/data/libpostal/dictionaries/en/nulls.txt +2 -0
- package/data/libpostal/dictionaries/en/number.txt +1 -0
- package/data/libpostal/dictionaries/en/personal_suffixes.txt +2 -0
- package/data/libpostal/dictionaries/en/personal_titles.txt +80 -0
- package/data/libpostal/dictionaries/en/place_names.txt +315 -0
- package/data/libpostal/dictionaries/en/post_office.txt +16 -0
- package/data/libpostal/dictionaries/en/qualifiers.txt +5 -0
- package/data/libpostal/dictionaries/en/staircases.txt +3 -0
- package/data/libpostal/dictionaries/en/stopwords.txt +14 -0
- package/data/libpostal/dictionaries/en/street_names.txt +358 -0
- package/data/libpostal/dictionaries/en/street_types.txt +410 -0
- package/data/libpostal/dictionaries/en/synonyms.txt +53 -0
- package/data/libpostal/dictionaries/en/toponyms.txt +80 -0
- package/data/libpostal/dictionaries/en/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/en/unit_types_numbered.txt +69 -0
- package/data/libpostal/dictionaries/en/unit_types_standalone.txt +16 -0
- package/data/libpostal/dictionaries/es/academic_degrees.txt +2 -0
- package/data/libpostal/dictionaries/es/ambiguous_expansions.txt +45 -0
- package/data/libpostal/dictionaries/es/building_types.txt +15 -0
- package/data/libpostal/dictionaries/es/company_types.txt +49 -0
- package/data/libpostal/dictionaries/es/cross_streets.txt +9 -0
- package/data/libpostal/dictionaries/es/directionals.txt +13 -0
- package/data/libpostal/dictionaries/es/entrances.txt +3 -0
- package/data/libpostal/dictionaries/es/given_names.txt +3 -0
- package/data/libpostal/dictionaries/es/house_numbers.txt +2 -0
- package/data/libpostal/dictionaries/es/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/es/level_types_mezzanine.txt +1 -0
- package/data/libpostal/dictionaries/es/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/es/level_types_standalone.txt +7 -0
- package/data/libpostal/dictionaries/es/level_types_sub_basement.txt +1 -0
- package/data/libpostal/dictionaries/es/near.txt +10 -0
- package/data/libpostal/dictionaries/es/no_number.txt +1 -0
- package/data/libpostal/dictionaries/es/number.txt +1 -0
- package/data/libpostal/dictionaries/es/personal_suffixes.txt +1 -0
- package/data/libpostal/dictionaries/es/personal_titles.txt +132 -0
- package/data/libpostal/dictionaries/es/place_names.txt +234 -0
- package/data/libpostal/dictionaries/es/post_office.txt +4 -0
- package/data/libpostal/dictionaries/es/postcodes.txt +1 -0
- package/data/libpostal/dictionaries/es/qualifiers.txt +34 -0
- package/data/libpostal/dictionaries/es/staircases.txt +2 -0
- package/data/libpostal/dictionaries/es/stopwords.txt +29 -0
- package/data/libpostal/dictionaries/es/street_types.txt +109 -0
- package/data/libpostal/dictionaries/es/surnames.txt +6 -0
- package/data/libpostal/dictionaries/es/synonyms.txt +58 -0
- package/data/libpostal/dictionaries/es/toponyms.txt +39 -0
- package/data/libpostal/dictionaries/es/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/es/unit_types_numbered.txt +15 -0
- package/data/libpostal/dictionaries/es/unit_types_standalone.txt +5 -0
- package/data/libpostal/dictionaries/et/ambiguous_expansions.txt +5 -0
- package/data/libpostal/dictionaries/et/building_types.txt +3 -0
- package/data/libpostal/dictionaries/et/company_types.txt +10 -0
- package/data/libpostal/dictionaries/et/cross_streets.txt +4 -0
- package/data/libpostal/dictionaries/et/directionals.txt +9 -0
- package/data/libpostal/dictionaries/et/entrances.txt +1 -0
- package/data/libpostal/dictionaries/et/level_types_basement.txt +2 -0
- package/data/libpostal/dictionaries/et/level_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/et/near.txt +4 -0
- package/data/libpostal/dictionaries/et/number.txt +1 -0
- package/data/libpostal/dictionaries/et/personal_titles.txt +13 -0
- package/data/libpostal/dictionaries/et/place_names.txt +39 -0
- package/data/libpostal/dictionaries/et/post_office.txt +2 -0
- package/data/libpostal/dictionaries/et/qualifiers.txt +6 -0
- package/data/libpostal/dictionaries/et/staircases.txt +1 -0
- package/data/libpostal/dictionaries/et/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/et/street_types.txt +10 -0
- package/data/libpostal/dictionaries/et/toponyms.txt +1 -0
- package/data/libpostal/dictionaries/et/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/et/unit_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/eu/ambiguous_expansions.txt +2 -0
- package/data/libpostal/dictionaries/eu/cross_streets.txt +4 -0
- package/data/libpostal/dictionaries/eu/entrances.txt +1 -0
- package/data/libpostal/dictionaries/eu/level_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/eu/level_types_standalone.txt +2 -0
- package/data/libpostal/dictionaries/eu/near.txt +5 -0
- package/data/libpostal/dictionaries/eu/no_number.txt +1 -0
- package/data/libpostal/dictionaries/eu/place_names.txt +63 -0
- package/data/libpostal/dictionaries/eu/post_office.txt +1 -0
- package/data/libpostal/dictionaries/eu/postcodes.txt +1 -0
- package/data/libpostal/dictionaries/eu/qualifiers.txt +2 -0
- package/data/libpostal/dictionaries/eu/staircases.txt +1 -0
- package/data/libpostal/dictionaries/eu/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/eu/street_types.txt +18 -0
- package/data/libpostal/dictionaries/eu/unit_directions.txt +3 -0
- package/data/libpostal/dictionaries/eu/unit_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/fa/personal_titles.txt +6 -0
- package/data/libpostal/dictionaries/fa/place_names.txt +3 -0
- package/data/libpostal/dictionaries/fa/street_types.txt +7 -0
- package/data/libpostal/dictionaries/fi/ambiguous_expansions.txt +5 -0
- package/data/libpostal/dictionaries/fi/building_types.txt +3 -0
- package/data/libpostal/dictionaries/fi/chains.txt +1 -0
- package/data/libpostal/dictionaries/fi/concatenated_suffixes_separable.txt +20 -0
- package/data/libpostal/dictionaries/fi/cross_streets.txt +3 -0
- package/data/libpostal/dictionaries/fi/directionals.txt +4 -0
- package/data/libpostal/dictionaries/fi/entrances.txt +1 -0
- package/data/libpostal/dictionaries/fi/level_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/fi/near.txt +5 -0
- package/data/libpostal/dictionaries/fi/number.txt +1 -0
- package/data/libpostal/dictionaries/fi/post_office.txt +1 -0
- package/data/libpostal/dictionaries/fi/qualifiers.txt +2 -0
- package/data/libpostal/dictionaries/fi/staircases.txt +1 -0
- package/data/libpostal/dictionaries/fi/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/fi/street_types.txt +20 -0
- package/data/libpostal/dictionaries/fi/synonyms.txt +1 -0
- package/data/libpostal/dictionaries/fi/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/fi/unit_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/fil/street_types.txt +3 -0
- package/data/libpostal/dictionaries/fr/ambiguous_expansions.txt +25 -0
- package/data/libpostal/dictionaries/fr/building_types.txt +4 -0
- package/data/libpostal/dictionaries/fr/chains.txt +2 -0
- package/data/libpostal/dictionaries/fr/company_types.txt +40 -0
- package/data/libpostal/dictionaries/fr/cross_streets.txt +5 -0
- package/data/libpostal/dictionaries/fr/directionals.txt +12 -0
- package/data/libpostal/dictionaries/fr/elisions.txt +9 -0
- package/data/libpostal/dictionaries/fr/entrances.txt +2 -0
- package/data/libpostal/dictionaries/fr/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/fr/level_types_mezzanine.txt +1 -0
- package/data/libpostal/dictionaries/fr/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/fr/level_types_standalone.txt +8 -0
- package/data/libpostal/dictionaries/fr/level_types_sub_basement.txt +1 -0
- package/data/libpostal/dictionaries/fr/near.txt +20 -0
- package/data/libpostal/dictionaries/fr/no_number.txt +1 -0
- package/data/libpostal/dictionaries/fr/number.txt +1 -0
- package/data/libpostal/dictionaries/fr/people.txt +1 -0
- package/data/libpostal/dictionaries/fr/personal_titles.txt +57 -0
- package/data/libpostal/dictionaries/fr/place_names.txt +147 -0
- package/data/libpostal/dictionaries/fr/post_office.txt +3 -0
- package/data/libpostal/dictionaries/fr/qualifiers.txt +19 -0
- package/data/libpostal/dictionaries/fr/staircases.txt +1 -0
- package/data/libpostal/dictionaries/fr/stopwords.txt +28 -0
- package/data/libpostal/dictionaries/fr/street_types.txt +165 -0
- package/data/libpostal/dictionaries/fr/synonyms.txt +14 -0
- package/data/libpostal/dictionaries/fr/toponyms.txt +13 -0
- package/data/libpostal/dictionaries/fr/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/fr/unit_types_numbered.txt +10 -0
- package/data/libpostal/dictionaries/ga/building_types.txt +16 -0
- package/data/libpostal/dictionaries/ga/level_types_standalone.txt +1 -0
- package/data/libpostal/dictionaries/ga/personal_titles.txt +1 -0
- package/data/libpostal/dictionaries/ga/place_names.txt +10 -0
- package/data/libpostal/dictionaries/ga/street_types.txt +95 -0
- package/data/libpostal/dictionaries/ga/unit_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/gd/building_types.txt +8 -0
- package/data/libpostal/dictionaries/gd/directionals.txt +6 -0
- package/data/libpostal/dictionaries/gd/place_names.txt +7 -0
- package/data/libpostal/dictionaries/gd/qualifiers.txt +1 -0
- package/data/libpostal/dictionaries/gd/stopwords.txt +2 -0
- package/data/libpostal/dictionaries/gd/street_types.txt +52 -0
- package/data/libpostal/dictionaries/gl/ambiguous_expansions.txt +6 -0
- package/data/libpostal/dictionaries/gl/directionals.txt +8 -0
- package/data/libpostal/dictionaries/gl/personal_titles.txt +2 -0
- package/data/libpostal/dictionaries/gl/stopwords.txt +39 -0
- package/data/libpostal/dictionaries/gl/street_types.txt +26 -0
- package/data/libpostal/dictionaries/gl/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/gsw/ambiguous_expansions.txt +1 -0
- package/data/libpostal/dictionaries/gsw/concatenated_suffixes_separable.txt +8 -0
- package/data/libpostal/dictionaries/gsw/street_types.txt +8 -0
- package/data/libpostal/dictionaries/he/entrances.txt +2 -0
- package/data/libpostal/dictionaries/he/level_types_basement.txt +2 -0
- package/data/libpostal/dictionaries/he/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/he/level_types_standalone.txt +2 -0
- package/data/libpostal/dictionaries/he/personal_titles.txt +2 -0
- package/data/libpostal/dictionaries/he/post_office.txt +2 -0
- package/data/libpostal/dictionaries/he/street_types.txt +8 -0
- package/data/libpostal/dictionaries/he/unit_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/hi/street_types.txt +3 -0
- package/data/libpostal/dictionaries/hr/ambiguous_expansions.txt +6 -0
- package/data/libpostal/dictionaries/hr/building_types.txt +1 -0
- package/data/libpostal/dictionaries/hr/cross_streets.txt +6 -0
- package/data/libpostal/dictionaries/hr/directionals.txt +4 -0
- package/data/libpostal/dictionaries/hr/entrances.txt +1 -0
- package/data/libpostal/dictionaries/hr/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/hr/level_types_mezzanine.txt +1 -0
- package/data/libpostal/dictionaries/hr/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/hr/level_types_standalone.txt +2 -0
- package/data/libpostal/dictionaries/hr/near.txt +5 -0
- package/data/libpostal/dictionaries/hr/no_number.txt +1 -0
- package/data/libpostal/dictionaries/hr/personal_titles.txt +6 -0
- package/data/libpostal/dictionaries/hr/place_names.txt +18 -0
- package/data/libpostal/dictionaries/hr/post_office.txt +1 -0
- package/data/libpostal/dictionaries/hr/qualifiers.txt +1 -0
- package/data/libpostal/dictionaries/hr/staircases.txt +1 -0
- package/data/libpostal/dictionaries/hr/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/hr/street_types.txt +12 -0
- package/data/libpostal/dictionaries/hr/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/hr/unit_types_numbered.txt +4 -0
- package/data/libpostal/dictionaries/hu/ambiguous_expansions.txt +6 -0
- package/data/libpostal/dictionaries/hu/cross_streets.txt +5 -0
- package/data/libpostal/dictionaries/hu/directionals.txt +8 -0
- package/data/libpostal/dictionaries/hu/level_types_basement.txt +4 -0
- package/data/libpostal/dictionaries/hu/level_types_mezzanine.txt +2 -0
- package/data/libpostal/dictionaries/hu/level_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/hu/level_types_standalone.txt +1 -0
- package/data/libpostal/dictionaries/hu/near.txt +3 -0
- package/data/libpostal/dictionaries/hu/number.txt +1 -0
- package/data/libpostal/dictionaries/hu/personal_titles.txt +1 -0
- package/data/libpostal/dictionaries/hu/post_office.txt +1 -0
- package/data/libpostal/dictionaries/hu/stopwords.txt +4 -0
- package/data/libpostal/dictionaries/hu/street_types.txt +21 -0
- package/data/libpostal/dictionaries/hu/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/hu/unit_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/id/academic_degrees.txt +78 -0
- package/data/libpostal/dictionaries/id/ambiguous_expansions.txt +64 -0
- package/data/libpostal/dictionaries/id/building_types.txt +7 -0
- package/data/libpostal/dictionaries/id/chains.txt +5 -0
- package/data/libpostal/dictionaries/id/company_types.txt +15 -0
- package/data/libpostal/dictionaries/id/cross_streets.txt +6 -0
- package/data/libpostal/dictionaries/id/directionals.txt +9 -0
- package/data/libpostal/dictionaries/id/entrances.txt +3 -0
- package/data/libpostal/dictionaries/id/level_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/id/level_types_standalone.txt +3 -0
- package/data/libpostal/dictionaries/id/near.txt +3 -0
- package/data/libpostal/dictionaries/id/number.txt +1 -0
- package/data/libpostal/dictionaries/id/personal_titles.txt +34 -0
- package/data/libpostal/dictionaries/id/place_names.txt +145 -0
- package/data/libpostal/dictionaries/id/qualifiers.txt +13 -0
- package/data/libpostal/dictionaries/id/stopwords.txt +9 -0
- package/data/libpostal/dictionaries/id/street_types.txt +7 -0
- package/data/libpostal/dictionaries/id/synonyms.txt +22 -0
- package/data/libpostal/dictionaries/id/toponyms.txt +34 -0
- package/data/libpostal/dictionaries/id/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/id/unit_types_numbered.txt +16 -0
- package/data/libpostal/dictionaries/id/unit_types_standalone.txt +9 -0
- package/data/libpostal/dictionaries/is/ambiguous_expansions.txt +6 -0
- package/data/libpostal/dictionaries/is/concatenated_suffixes_inseparable.txt +29 -0
- package/data/libpostal/dictionaries/is/cross_streets.txt +4 -0
- package/data/libpostal/dictionaries/is/directionals.txt +4 -0
- package/data/libpostal/dictionaries/is/entrances.txt +1 -0
- package/data/libpostal/dictionaries/is/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/is/level_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/is/level_types_standalone.txt +1 -0
- package/data/libpostal/dictionaries/is/near.txt +6 -0
- package/data/libpostal/dictionaries/is/number.txt +1 -0
- package/data/libpostal/dictionaries/is/post_office.txt +1 -0
- package/data/libpostal/dictionaries/is/qualifiers.txt +2 -0
- package/data/libpostal/dictionaries/is/staircases.txt +1 -0
- package/data/libpostal/dictionaries/is/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/is/street_types.txt +29 -0
- package/data/libpostal/dictionaries/is/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/is/unit_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/it/academic_degrees.txt +1 -0
- package/data/libpostal/dictionaries/it/ambiguous_expansions.txt +8 -0
- package/data/libpostal/dictionaries/it/building_types.txt +5 -0
- package/data/libpostal/dictionaries/it/chains.txt +5 -0
- package/data/libpostal/dictionaries/it/company_types.txt +16 -0
- package/data/libpostal/dictionaries/it/cross_streets.txt +7 -0
- package/data/libpostal/dictionaries/it/directionals.txt +11 -0
- package/data/libpostal/dictionaries/it/elisions.txt +4 -0
- package/data/libpostal/dictionaries/it/entrances.txt +1 -0
- package/data/libpostal/dictionaries/it/level_types_basement.txt +2 -0
- package/data/libpostal/dictionaries/it/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/it/level_types_standalone.txt +2 -0
- package/data/libpostal/dictionaries/it/near.txt +10 -0
- package/data/libpostal/dictionaries/it/no_number.txt +2 -0
- package/data/libpostal/dictionaries/it/number.txt +1 -0
- package/data/libpostal/dictionaries/it/personal_titles.txt +72 -0
- package/data/libpostal/dictionaries/it/place_names.txt +203 -0
- package/data/libpostal/dictionaries/it/post_office.txt +2 -0
- package/data/libpostal/dictionaries/it/qualifiers.txt +16 -0
- package/data/libpostal/dictionaries/it/staircases.txt +1 -0
- package/data/libpostal/dictionaries/it/stopwords.txt +47 -0
- package/data/libpostal/dictionaries/it/street_types.txt +151 -0
- package/data/libpostal/dictionaries/it/synonyms.txt +115 -0
- package/data/libpostal/dictionaries/it/toponyms.txt +110 -0
- package/data/libpostal/dictionaries/it/unit_types_numbered.txt +9 -0
- package/data/libpostal/dictionaries/ja/ambiguous_expansions.txt +5 -0
- package/data/libpostal/dictionaries/ja/building_types.txt +6 -0
- package/data/libpostal/dictionaries/ja/chains.txt +27 -0
- package/data/libpostal/dictionaries/ja/directionals.txt +16 -0
- package/data/libpostal/dictionaries/ja/level_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/ja/number.txt +2 -0
- package/data/libpostal/dictionaries/ja/place_names.txt +16 -0
- package/data/libpostal/dictionaries/ja/post_office.txt +2 -0
- package/data/libpostal/dictionaries/ja/postcodes.txt +2 -0
- package/data/libpostal/dictionaries/ja/qualifiers.txt +38 -0
- package/data/libpostal/dictionaries/ja/street_types.txt +67 -0
- package/data/libpostal/dictionaries/ka/ambiguous_expansions.txt +2 -0
- package/data/libpostal/dictionaries/ka/personal_titles.txt +4 -0
- package/data/libpostal/dictionaries/ka/place_names.txt +7 -0
- package/data/libpostal/dictionaries/ka/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/ka/street_types.txt +12 -0
- package/data/libpostal/dictionaries/ko/directionals.txt +31 -0
- package/data/libpostal/dictionaries/ko/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/ko/number.txt +3 -0
- package/data/libpostal/dictionaries/ko/post_office.txt +2 -0
- package/data/libpostal/dictionaries/ko/postcodes.txt +2 -0
- package/data/libpostal/dictionaries/ko/qualifiers.txt +6 -0
- package/data/libpostal/dictionaries/ko/street_types.txt +8 -0
- package/data/libpostal/dictionaries/lb/concatenated_suffixes_separable.txt +3 -0
- package/data/libpostal/dictionaries/lb/street_types.txt +3 -0
- package/data/libpostal/dictionaries/lt/ambiguous_expansions.txt +6 -0
- package/data/libpostal/dictionaries/lt/building_types.txt +1 -0
- package/data/libpostal/dictionaries/lt/cross_streets.txt +4 -0
- package/data/libpostal/dictionaries/lt/directionals.txt +4 -0
- package/data/libpostal/dictionaries/lt/entrances.txt +1 -0
- package/data/libpostal/dictionaries/lt/level_types_basement.txt +2 -0
- package/data/libpostal/dictionaries/lt/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/lt/level_types_standalone.txt +1 -0
- package/data/libpostal/dictionaries/lt/number.txt +1 -0
- package/data/libpostal/dictionaries/lt/post_office.txt +1 -0
- package/data/libpostal/dictionaries/lt/qualifiers.txt +5 -0
- package/data/libpostal/dictionaries/lt/staircases.txt +1 -0
- package/data/libpostal/dictionaries/lt/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/lt/street_types.txt +7 -0
- package/data/libpostal/dictionaries/lt/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/lt/unit_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/lv/ambiguous_expansions.txt +6 -0
- package/data/libpostal/dictionaries/lv/cross_streets.txt +5 -0
- package/data/libpostal/dictionaries/lv/directionals.txt +4 -0
- package/data/libpostal/dictionaries/lv/entrances.txt +1 -0
- package/data/libpostal/dictionaries/lv/level_types_basement.txt +2 -0
- package/data/libpostal/dictionaries/lv/level_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/lv/level_types_standalone.txt +1 -0
- package/data/libpostal/dictionaries/lv/number.txt +1 -0
- package/data/libpostal/dictionaries/lv/place_names.txt +2 -0
- package/data/libpostal/dictionaries/lv/staircases.txt +2 -0
- package/data/libpostal/dictionaries/lv/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/lv/street_types.txt +5 -0
- package/data/libpostal/dictionaries/lv/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/lv/unit_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/ms/ambiguous_expansions.txt +1 -0
- package/data/libpostal/dictionaries/ms/building_types.txt +10 -0
- package/data/libpostal/dictionaries/ms/company_types.txt +8 -0
- package/data/libpostal/dictionaries/ms/directionals.txt +9 -0
- package/data/libpostal/dictionaries/ms/given_names.txt +3 -0
- package/data/libpostal/dictionaries/ms/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/ms/personal_titles.txt +92 -0
- package/data/libpostal/dictionaries/ms/place_names.txt +145 -0
- package/data/libpostal/dictionaries/ms/post_office.txt +3 -0
- package/data/libpostal/dictionaries/ms/qualifiers.txt +6 -0
- package/data/libpostal/dictionaries/ms/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/ms/street_types.txt +35 -0
- package/data/libpostal/dictionaries/ms/synonyms.txt +27 -0
- package/data/libpostal/dictionaries/mt/ambiguous_expansions.txt +1 -0
- package/data/libpostal/dictionaries/mt/number.txt +1 -0
- package/data/libpostal/dictionaries/mt/personal_titles.txt +6 -0
- package/data/libpostal/dictionaries/mt/place_names.txt +1 -0
- package/data/libpostal/dictionaries/mt/stopwords.txt +5 -0
- package/data/libpostal/dictionaries/mt/street_types.txt +6 -0
- package/data/libpostal/dictionaries/nb/ambiguous_expansions.txt +11 -0
- package/data/libpostal/dictionaries/nb/building_types.txt +3 -0
- package/data/libpostal/dictionaries/nb/concatenated_suffixes_inseparable.txt +13 -0
- package/data/libpostal/dictionaries/nb/concatenated_suffixes_separable.txt +6 -0
- package/data/libpostal/dictionaries/nb/cross_streets.txt +5 -0
- package/data/libpostal/dictionaries/nb/directionals.txt +13 -0
- package/data/libpostal/dictionaries/nb/entrances.txt +1 -0
- package/data/libpostal/dictionaries/nb/level_types_numbered.txt +5 -0
- package/data/libpostal/dictionaries/nb/near.txt +7 -0
- package/data/libpostal/dictionaries/nb/number.txt +1 -0
- package/data/libpostal/dictionaries/nb/personal_titles.txt +1 -0
- package/data/libpostal/dictionaries/nb/post_office.txt +1 -0
- package/data/libpostal/dictionaries/nb/staircases.txt +2 -0
- package/data/libpostal/dictionaries/nb/stopwords.txt +34 -0
- package/data/libpostal/dictionaries/nb/street_types.txt +20 -0
- package/data/libpostal/dictionaries/nb/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/nb/unit_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/nl/ambiguous_expansions.txt +10 -0
- package/data/libpostal/dictionaries/nl/building_types.txt +1 -0
- package/data/libpostal/dictionaries/nl/chains.txt +1 -0
- package/data/libpostal/dictionaries/nl/concatenated_suffixes_inseparable.txt +3 -0
- package/data/libpostal/dictionaries/nl/concatenated_suffixes_separable.txt +13 -0
- package/data/libpostal/dictionaries/nl/cross_streets.txt +4 -0
- package/data/libpostal/dictionaries/nl/directionals.txt +20 -0
- package/data/libpostal/dictionaries/nl/entrances.txt +1 -0
- package/data/libpostal/dictionaries/nl/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/nl/level_types_standalone.txt +5 -0
- package/data/libpostal/dictionaries/nl/near.txt +7 -0
- package/data/libpostal/dictionaries/nl/number.txt +1 -0
- package/data/libpostal/dictionaries/nl/personal_titles.txt +32 -0
- package/data/libpostal/dictionaries/nl/place_names.txt +81 -0
- package/data/libpostal/dictionaries/nl/post_office.txt +1 -0
- package/data/libpostal/dictionaries/nl/qualifiers.txt +4 -0
- package/data/libpostal/dictionaries/nl/staircases.txt +2 -0
- package/data/libpostal/dictionaries/nl/stopwords.txt +38 -0
- package/data/libpostal/dictionaries/nl/street_types.txt +22 -0
- package/data/libpostal/dictionaries/nl/synonyms.txt +2 -0
- package/data/libpostal/dictionaries/nl/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/nl/unit_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/oc/elisions.txt +1 -0
- package/data/libpostal/dictionaries/oc/stopwords.txt +14 -0
- package/data/libpostal/dictionaries/oc/street_types.txt +5 -0
- package/data/libpostal/dictionaries/pap/personal_titles.txt +2 -0
- package/data/libpostal/dictionaries/pap/street_types.txt +2 -0
- package/data/libpostal/dictionaries/pl/academic_degrees.txt +2 -0
- package/data/libpostal/dictionaries/pl/ambiguous_expansions.txt +9 -0
- package/data/libpostal/dictionaries/pl/building_types.txt +1 -0
- package/data/libpostal/dictionaries/pl/chains.txt +3 -0
- package/data/libpostal/dictionaries/pl/company_types.txt +4 -0
- package/data/libpostal/dictionaries/pl/cross_streets.txt +6 -0
- package/data/libpostal/dictionaries/pl/directionals.txt +8 -0
- package/data/libpostal/dictionaries/pl/entrances.txt +1 -0
- package/data/libpostal/dictionaries/pl/house_numbers.txt +1 -0
- package/data/libpostal/dictionaries/pl/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/pl/level_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/pl/level_types_standalone.txt +1 -0
- package/data/libpostal/dictionaries/pl/near.txt +11 -0
- package/data/libpostal/dictionaries/pl/number.txt +1 -0
- package/data/libpostal/dictionaries/pl/personal_suffixes.txt +2 -0
- package/data/libpostal/dictionaries/pl/personal_titles.txt +54 -0
- package/data/libpostal/dictionaries/pl/place_names.txt +31 -0
- package/data/libpostal/dictionaries/pl/post_office.txt +1 -0
- package/data/libpostal/dictionaries/pl/qualifiers.txt +9 -0
- package/data/libpostal/dictionaries/pl/staircases.txt +1 -0
- package/data/libpostal/dictionaries/pl/stopwords.txt +3 -0
- package/data/libpostal/dictionaries/pl/street_types.txt +12 -0
- package/data/libpostal/dictionaries/pl/synonyms.txt +19 -0
- package/data/libpostal/dictionaries/pl/toponyms.txt +1 -0
- package/data/libpostal/dictionaries/pl/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/pl/unit_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/pt/ambiguous_expansions.txt +12 -0
- package/data/libpostal/dictionaries/pt/building_types.txt +7 -0
- package/data/libpostal/dictionaries/pt/company_types.txt +31 -0
- package/data/libpostal/dictionaries/pt/cross_streets.txt +8 -0
- package/data/libpostal/dictionaries/pt/directionals.txt +8 -0
- package/data/libpostal/dictionaries/pt/elisions.txt +1 -0
- package/data/libpostal/dictionaries/pt/entrances.txt +1 -0
- package/data/libpostal/dictionaries/pt/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/pt/level_types_mezzanine.txt +1 -0
- package/data/libpostal/dictionaries/pt/level_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/pt/level_types_standalone.txt +5 -0
- package/data/libpostal/dictionaries/pt/level_types_sub_basement.txt +1 -0
- package/data/libpostal/dictionaries/pt/near.txt +13 -0
- package/data/libpostal/dictionaries/pt/no_number.txt +1 -0
- package/data/libpostal/dictionaries/pt/number.txt +1 -0
- package/data/libpostal/dictionaries/pt/personal_suffixes.txt +3 -0
- package/data/libpostal/dictionaries/pt/personal_titles.txt +101 -0
- package/data/libpostal/dictionaries/pt/place_names.txt +52 -0
- package/data/libpostal/dictionaries/pt/post_office.txt +2 -0
- package/data/libpostal/dictionaries/pt/postcodes.txt +2 -0
- package/data/libpostal/dictionaries/pt/qualifiers.txt +8 -0
- package/data/libpostal/dictionaries/pt/staircases.txt +1 -0
- package/data/libpostal/dictionaries/pt/stopwords.txt +35 -0
- package/data/libpostal/dictionaries/pt/street_types.txt +53 -0
- package/data/libpostal/dictionaries/pt/synonyms.txt +21 -0
- package/data/libpostal/dictionaries/pt/toponyms.txt +28 -0
- package/data/libpostal/dictionaries/pt/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/pt/unit_types_numbered.txt +10 -0
- package/data/libpostal/dictionaries/pt/unit_types_standalone.txt +1 -0
- package/data/libpostal/dictionaries/ro/ambiguous_expansions.txt +5 -0
- package/data/libpostal/dictionaries/ro/cross_streets.txt +5 -0
- package/data/libpostal/dictionaries/ro/directionals.txt +4 -0
- package/data/libpostal/dictionaries/ro/entrances.txt +1 -0
- package/data/libpostal/dictionaries/ro/level_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/ro/level_types_standalone.txt +1 -0
- package/data/libpostal/dictionaries/ro/near.txt +7 -0
- package/data/libpostal/dictionaries/ro/no_number.txt +1 -0
- package/data/libpostal/dictionaries/ro/number.txt +1 -0
- package/data/libpostal/dictionaries/ro/personal_titles.txt +14 -0
- package/data/libpostal/dictionaries/ro/post_office.txt +1 -0
- package/data/libpostal/dictionaries/ro/qualifiers.txt +1 -0
- package/data/libpostal/dictionaries/ro/staircases.txt +1 -0
- package/data/libpostal/dictionaries/ro/stopwords.txt +2 -0
- package/data/libpostal/dictionaries/ro/street_types.txt +13 -0
- package/data/libpostal/dictionaries/ro/unit_types_numbered.txt +4 -0
- package/data/libpostal/dictionaries/ru/ambiguous_expansions.txt +18 -0
- package/data/libpostal/dictionaries/ru/building_types.txt +2 -0
- package/data/libpostal/dictionaries/ru/chains.txt +42 -0
- package/data/libpostal/dictionaries/ru/company_types.txt +9 -0
- package/data/libpostal/dictionaries/ru/cross_streets.txt +11 -0
- package/data/libpostal/dictionaries/ru/directionals.txt +16 -0
- package/data/libpostal/dictionaries/ru/entrances.txt +2 -0
- package/data/libpostal/dictionaries/ru/house_numbers.txt +2 -0
- package/data/libpostal/dictionaries/ru/level_types_basement.txt +4 -0
- package/data/libpostal/dictionaries/ru/level_types_numbered.txt +4 -0
- package/data/libpostal/dictionaries/ru/level_types_standalone.txt +4 -0
- package/data/libpostal/dictionaries/ru/near.txt +26 -0
- package/data/libpostal/dictionaries/ru/no_number.txt +1 -0
- package/data/libpostal/dictionaries/ru/number.txt +2 -0
- package/data/libpostal/dictionaries/ru/personal_titles.txt +6 -0
- package/data/libpostal/dictionaries/ru/place_names.txt +160 -0
- package/data/libpostal/dictionaries/ru/post_office.txt +2 -0
- package/data/libpostal/dictionaries/ru/qualifiers.txt +31 -0
- package/data/libpostal/dictionaries/ru/staircases.txt +2 -0
- package/data/libpostal/dictionaries/ru/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/ru/street_types.txt +28 -0
- package/data/libpostal/dictionaries/ru/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/ru/unit_types_numbered.txt +10 -0
- package/data/libpostal/dictionaries/si/place_names.txt +8 -0
- package/data/libpostal/dictionaries/si/qualifiers.txt +4 -0
- package/data/libpostal/dictionaries/si/street_types.txt +2 -0
- package/data/libpostal/dictionaries/sk/ambiguous_expansions.txt +6 -0
- package/data/libpostal/dictionaries/sk/cross_streets.txt +8 -0
- package/data/libpostal/dictionaries/sk/directionals.txt +21 -0
- package/data/libpostal/dictionaries/sk/entrances.txt +1 -0
- package/data/libpostal/dictionaries/sk/house_numbers.txt +1 -0
- package/data/libpostal/dictionaries/sk/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/sk/level_types_numbered.txt +4 -0
- package/data/libpostal/dictionaries/sk/level_types_standalone.txt +1 -0
- package/data/libpostal/dictionaries/sk/near.txt +13 -0
- package/data/libpostal/dictionaries/sk/number.txt +1 -0
- package/data/libpostal/dictionaries/sk/personal_titles.txt +16 -0
- package/data/libpostal/dictionaries/sk/place_names.txt +28 -0
- package/data/libpostal/dictionaries/sk/post_office.txt +1 -0
- package/data/libpostal/dictionaries/sk/qualifiers.txt +3 -0
- package/data/libpostal/dictionaries/sk/staircases.txt +1 -0
- package/data/libpostal/dictionaries/sk/stopwords.txt +29 -0
- package/data/libpostal/dictionaries/sk/street_types.txt +20 -0
- package/data/libpostal/dictionaries/sk/toponyms.txt +1 -0
- package/data/libpostal/dictionaries/sk/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/sk/unit_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/sl/ambiguous_expansions.txt +6 -0
- package/data/libpostal/dictionaries/sl/chains.txt +1 -0
- package/data/libpostal/dictionaries/sl/cross_streets.txt +5 -0
- package/data/libpostal/dictionaries/sl/directionals.txt +4 -0
- package/data/libpostal/dictionaries/sl/entrances.txt +1 -0
- package/data/libpostal/dictionaries/sl/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/sl/level_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/sl/level_types_standalone.txt +2 -0
- package/data/libpostal/dictionaries/sl/near.txt +7 -0
- package/data/libpostal/dictionaries/sl/no_number.txt +1 -0
- package/data/libpostal/dictionaries/sl/number.txt +1 -0
- package/data/libpostal/dictionaries/sl/personal_titles.txt +3 -0
- package/data/libpostal/dictionaries/sl/place_names.txt +1 -0
- package/data/libpostal/dictionaries/sl/post_office.txt +1 -0
- package/data/libpostal/dictionaries/sl/staircases.txt +1 -0
- package/data/libpostal/dictionaries/sl/stopwords.txt +7 -0
- package/data/libpostal/dictionaries/sl/street_types.txt +4 -0
- package/data/libpostal/dictionaries/sl/synonyms.txt +13 -0
- package/data/libpostal/dictionaries/sl/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/sl/unit_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/sr/ambiguous_expansions.txt +9 -0
- package/data/libpostal/dictionaries/sr/cross_streets.txt +10 -0
- package/data/libpostal/dictionaries/sr/directionals.txt +8 -0
- package/data/libpostal/dictionaries/sr/entrances.txt +2 -0
- package/data/libpostal/dictionaries/sr/level_types_basement.txt +2 -0
- package/data/libpostal/dictionaries/sr/level_types_numbered.txt +6 -0
- package/data/libpostal/dictionaries/sr/level_types_standalone.txt +4 -0
- package/data/libpostal/dictionaries/sr/number.txt +2 -0
- package/data/libpostal/dictionaries/sr/personal_titles.txt +14 -0
- package/data/libpostal/dictionaries/sr/place_names.txt +12 -0
- package/data/libpostal/dictionaries/sr/post_office.txt +6 -0
- package/data/libpostal/dictionaries/sr/staircases.txt +2 -0
- package/data/libpostal/dictionaries/sr/stopwords.txt +2 -0
- package/data/libpostal/dictionaries/sr/street_types.txt +17 -0
- package/data/libpostal/dictionaries/sr/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/sr/unit_types_numbered.txt +8 -0
- package/data/libpostal/dictionaries/sv/ambiguous_expansions.txt +9 -0
- package/data/libpostal/dictionaries/sv/company_types.txt +4 -0
- package/data/libpostal/dictionaries/sv/concatenated_suffixes_inseparable.txt +5 -0
- package/data/libpostal/dictionaries/sv/concatenated_suffixes_separable.txt +8 -0
- package/data/libpostal/dictionaries/sv/cross_streets.txt +5 -0
- package/data/libpostal/dictionaries/sv/directionals.txt +8 -0
- package/data/libpostal/dictionaries/sv/entrances.txt +2 -0
- package/data/libpostal/dictionaries/sv/level_types_numbered.txt +7 -0
- package/data/libpostal/dictionaries/sv/level_types_standalone.txt +5 -0
- package/data/libpostal/dictionaries/sv/near.txt +11 -0
- package/data/libpostal/dictionaries/sv/number.txt +1 -0
- package/data/libpostal/dictionaries/sv/personal_titles.txt +3 -0
- package/data/libpostal/dictionaries/sv/post_office.txt +2 -0
- package/data/libpostal/dictionaries/sv/staircases.txt +3 -0
- package/data/libpostal/dictionaries/sv/stopwords.txt +25 -0
- package/data/libpostal/dictionaries/sv/street_types.txt +13 -0
- package/data/libpostal/dictionaries/sv/synonyms.txt +4 -0
- package/data/libpostal/dictionaries/sv/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/sv/unit_types_numbered.txt +5 -0
- package/data/libpostal/dictionaries/th/chains.txt +2 -0
- package/data/libpostal/dictionaries/th/street_types.txt +10 -0
- package/data/libpostal/dictionaries/tr/ambiguous_expansions.txt +5 -0
- package/data/libpostal/dictionaries/tr/chains.txt +1 -0
- package/data/libpostal/dictionaries/tr/cross_streets.txt +4 -0
- package/data/libpostal/dictionaries/tr/directionals.txt +4 -0
- package/data/libpostal/dictionaries/tr/entrances.txt +1 -0
- package/data/libpostal/dictionaries/tr/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/tr/level_types_mezzanine.txt +1 -0
- package/data/libpostal/dictionaries/tr/level_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/tr/level_types_standalone.txt +1 -0
- package/data/libpostal/dictionaries/tr/number.txt +2 -0
- package/data/libpostal/dictionaries/tr/personal_titles.txt +4 -0
- package/data/libpostal/dictionaries/tr/place_names.txt +2 -0
- package/data/libpostal/dictionaries/tr/post_office.txt +1 -0
- package/data/libpostal/dictionaries/tr/qualifiers.txt +5 -0
- package/data/libpostal/dictionaries/tr/staircases.txt +1 -0
- package/data/libpostal/dictionaries/tr/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/tr/street_types.txt +10 -0
- package/data/libpostal/dictionaries/tr/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/tr/unit_types_numbered.txt +4 -0
- package/data/libpostal/dictionaries/uk/ambiguous_expansions.txt +8 -0
- package/data/libpostal/dictionaries/uk/chains.txt +7 -0
- package/data/libpostal/dictionaries/uk/cross_streets.txt +10 -0
- package/data/libpostal/dictionaries/uk/directionals.txt +8 -0
- package/data/libpostal/dictionaries/uk/entrances.txt +2 -0
- package/data/libpostal/dictionaries/uk/house_numbers.txt +4 -0
- package/data/libpostal/dictionaries/uk/level_types_basement.txt +4 -0
- package/data/libpostal/dictionaries/uk/level_types_numbered.txt +4 -0
- package/data/libpostal/dictionaries/uk/level_types_standalone.txt +4 -0
- package/data/libpostal/dictionaries/uk/near.txt +24 -0
- package/data/libpostal/dictionaries/uk/number.txt +2 -0
- package/data/libpostal/dictionaries/uk/personal_titles.txt +9 -0
- package/data/libpostal/dictionaries/uk/place_names.txt +161 -0
- package/data/libpostal/dictionaries/uk/post_office.txt +2 -0
- package/data/libpostal/dictionaries/uk/qualifiers.txt +8 -0
- package/data/libpostal/dictionaries/uk/staircases.txt +2 -0
- package/data/libpostal/dictionaries/uk/stopwords.txt +2 -0
- package/data/libpostal/dictionaries/uk/street_types.txt +26 -0
- package/data/libpostal/dictionaries/uk/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/uk/unit_types_numbered.txt +10 -0
- package/data/libpostal/dictionaries/ur/street_types.txt +7 -0
- package/data/libpostal/dictionaries/vi/ambiguous_expansions.txt +3 -0
- package/data/libpostal/dictionaries/vi/personal_titles.txt +1 -0
- package/data/libpostal/dictionaries/vi/place_names.txt +29 -0
- package/data/libpostal/dictionaries/vi/qualifiers.txt +5 -0
- package/data/libpostal/dictionaries/vi/street_types.txt +10 -0
- package/data/libpostal/dictionaries/zh/building_types.txt +2 -0
- package/data/libpostal/dictionaries/zh/chains.txt +2 -0
- package/data/libpostal/dictionaries/zh/directionals.txt +20 -0
- package/data/libpostal/dictionaries/zh/level_types_numbered.txt +5 -0
- package/data/libpostal/dictionaries/zh/number.txt +3 -0
- package/data/libpostal/dictionaries/zh/place_names.txt +2 -0
- package/data/libpostal/dictionaries/zh/post_office.txt +3 -0
- package/data/libpostal/dictionaries/zh/postcodes.txt +3 -0
- package/data/libpostal/dictionaries/zh/qualifiers.txt +19 -0
- package/data/libpostal/dictionaries/zh/stopwords.txt +2 -0
- package/data/libpostal/dictionaries/zh/street_types.txt +30 -0
- package/data/libpostal/dictionaries/zh/unit_types_numbered.txt +2 -0
- package/data/libpostal/resources-download.sh +44 -0
- package/data/whosonfirst/dictionaries/country/name:eng_x_preferred.txt +220 -0
- package/data/whosonfirst/dictionaries/country/wof:country.txt +215 -0
- package/data/whosonfirst/dictionaries/country/wof:country_alpha3.txt +216 -0
- package/data/whosonfirst/dictionaries/dependency/name:eng_x_preferred.txt +42 -0
- package/data/whosonfirst/dictionaries/dependency/wof:shortcode.txt +34 -0
- package/data/whosonfirst/dictionaries/locality/name:eng_x_preferred.txt +261365 -0
- package/data/whosonfirst/dictionaries/locality/name:fra_x_preferred.txt +77631 -0
- package/data/whosonfirst/dictionaries/region/abrv:eng_x_preferred.txt +441 -0
- package/data/whosonfirst/dictionaries/region/name:eng_x_preferred.txt +4517 -0
- package/data/whosonfirst/dictionaries/region/wof:shortcode.txt +839 -0
- package/out/classification/BaseClassifier.d.ts +38 -0
- package/out/classification/BaseClassifier.d.ts.map +1 -0
- package/out/classification/BaseClassifier.js +12 -0
- package/out/classification/BaseClassifier.js.map +1 -0
- package/out/classification/Classification.d.ts +79 -0
- package/out/classification/Classification.d.ts.map +1 -0
- package/out/classification/Classification.js +133 -0
- package/out/classification/Classification.js.map +1 -0
- package/out/classification/CompositeClassifier.d.ts +16 -0
- package/out/classification/CompositeClassifier.d.ts.map +1 -0
- package/out/classification/CompositeClassifier.js +113 -0
- package/out/classification/CompositeClassifier.js.map +1 -0
- package/out/classification/PhraseClassifier.d.ts +23 -0
- package/out/classification/PhraseClassifier.d.ts.map +1 -0
- package/out/classification/PhraseClassifier.js +32 -0
- package/out/classification/PhraseClassifier.js.map +1 -0
- package/out/classification/SectionClassifier.d.ts +23 -0
- package/out/classification/SectionClassifier.d.ts.map +1 -0
- package/out/classification/SectionClassifier.js +27 -0
- package/out/classification/SectionClassifier.js.map +1 -0
- package/out/classification/WordClassifier.d.ts +22 -0
- package/out/classification/WordClassifier.d.ts.map +1 -0
- package/out/classification/WordClassifier.js +33 -0
- package/out/classification/WordClassifier.js.map +1 -0
- package/out/classification/index.d.ts +13 -0
- package/out/classification/index.d.ts.map +1 -0
- package/out/classification/index.js +13 -0
- package/out/classification/index.js.map +1 -0
- package/out/classification/scheme.d.ts +46 -0
- package/out/classification/scheme.d.ts.map +1 -0
- package/out/classification/scheme.js +37 -0
- package/out/classification/scheme.js.map +1 -0
- package/out/decoder/build-tree.d.ts +31 -0
- package/out/decoder/build-tree.d.ts.map +1 -0
- package/out/decoder/build-tree.js +100 -0
- package/out/decoder/build-tree.js.map +1 -0
- package/out/decoder/containment.d.ts +19 -0
- package/out/decoder/containment.d.ts.map +1 -0
- package/out/decoder/containment.js +47 -0
- package/out/decoder/containment.js.map +1 -0
- package/out/decoder/index.d.ts +13 -0
- package/out/decoder/index.d.ts.map +1 -0
- package/out/decoder/index.js +13 -0
- package/out/decoder/index.js.map +1 -0
- package/out/decoder/proposals-to-tree.d.ts +19 -0
- package/out/decoder/proposals-to-tree.d.ts.map +1 -0
- package/out/decoder/proposals-to-tree.js +28 -0
- package/out/decoder/proposals-to-tree.js.map +1 -0
- package/out/decoder/serialize-json.d.ts +15 -0
- package/out/decoder/serialize-json.d.ts.map +1 -0
- package/out/decoder/serialize-json.js +24 -0
- package/out/decoder/serialize-json.js.map +1 -0
- package/out/decoder/serialize-tuples.d.ts +16 -0
- package/out/decoder/serialize-tuples.d.ts.map +1 -0
- package/out/decoder/serialize-tuples.js +25 -0
- package/out/decoder/serialize-tuples.js.map +1 -0
- package/out/decoder/serialize-xml.d.ts +36 -0
- package/out/decoder/serialize-xml.d.ts.map +1 -0
- package/out/decoder/serialize-xml.js +60 -0
- package/out/decoder/serialize-xml.js.map +1 -0
- package/out/decoder/types.d.ts +71 -0
- package/out/decoder/types.d.ts.map +1 -0
- package/out/decoder/types.js +23 -0
- package/out/decoder/types.js.map +1 -0
- package/out/filters/InvalidSolutionFilter.d.ts +19 -0
- package/out/filters/InvalidSolutionFilter.d.ts.map +1 -0
- package/out/filters/InvalidSolutionFilter.js +29 -0
- package/out/filters/InvalidSolutionFilter.js.map +1 -0
- package/out/filters/RelationshipFilter.d.ts +14 -0
- package/out/filters/RelationshipFilter.d.ts.map +1 -0
- package/out/filters/RelationshipFilter.js +64 -0
- package/out/filters/RelationshipFilter.js.map +1 -0
- package/out/filters/SubsetFilter.d.ts +10 -0
- package/out/filters/SubsetFilter.d.ts.map +1 -0
- package/out/filters/SubsetFilter.js +26 -0
- package/out/filters/SubsetFilter.js.map +1 -0
- package/out/filters/TokenDistanceFilter.d.ts +10 -0
- package/out/filters/TokenDistanceFilter.d.ts.map +1 -0
- package/out/filters/TokenDistanceFilter.js +30 -0
- package/out/filters/TokenDistanceFilter.js.map +1 -0
- package/out/filters/index.d.ts +10 -0
- package/out/filters/index.d.ts.map +1 -0
- package/out/filters/index.js +10 -0
- package/out/filters/index.js.map +1 -0
- package/out/formatter/index.d.ts +11 -0
- package/out/formatter/index.d.ts.map +1 -0
- package/out/formatter/index.js +49 -0
- package/out/formatter/index.js.map +1 -0
- package/out/index.d.ts +14 -0
- package/out/index.d.ts.map +1 -0
- package/out/index.js +18 -0
- package/out/index.js.map +1 -0
- package/out/locale/index.d.ts +9 -0
- package/out/locale/index.d.ts.map +1 -0
- package/out/locale/index.js +9 -0
- package/out/locale/index.js.map +1 -0
- package/out/locale/locale.d.ts +43 -0
- package/out/locale/locale.d.ts.map +1 -0
- package/out/locale/locale.js +16 -0
- package/out/locale/locale.js.map +1 -0
- package/out/locale/profiles/en-us.d.ts +12 -0
- package/out/locale/profiles/en-us.d.ts.map +1 -0
- package/out/locale/profiles/en-us.js +67 -0
- package/out/locale/profiles/en-us.js.map +1 -0
- package/out/locale/profiles/fr-fr.d.ts +14 -0
- package/out/locale/profiles/fr-fr.d.ts.map +1 -0
- package/out/locale/profiles/fr-fr.js +73 -0
- package/out/locale/profiles/fr-fr.js.map +1 -0
- package/out/locale/profiles/index.d.ts +9 -0
- package/out/locale/profiles/index.d.ts.map +1 -0
- package/out/locale/profiles/index.js +9 -0
- package/out/locale/profiles/index.js.map +1 -0
- package/out/locale/profiles/ja-jp.d.ts +17 -0
- package/out/locale/profiles/ja-jp.d.ts.map +1 -0
- package/out/locale/profiles/ja-jp.js +31 -0
- package/out/locale/profiles/ja-jp.js.map +1 -0
- package/out/locale/registry.d.ts +20 -0
- package/out/locale/registry.d.ts.map +1 -0
- package/out/locale/registry.js +49 -0
- package/out/locale/registry.js.map +1 -0
- package/out/parser/AddressParser.d.ts +97 -0
- package/out/parser/AddressParser.d.ts.map +1 -0
- package/out/parser/AddressParser.js +116 -0
- package/out/parser/AddressParser.js.map +1 -0
- package/out/parser/index.d.ts +8 -0
- package/out/parser/index.d.ts.map +1 -0
- package/out/parser/index.js +8 -0
- package/out/parser/index.js.map +1 -0
- package/out/parser/proposal-pipeline.d.ts +67 -0
- package/out/parser/proposal-pipeline.d.ts.map +1 -0
- package/out/parser/proposal-pipeline.js +127 -0
- package/out/parser/proposal-pipeline.js.map +1 -0
- package/out/policy/defaults.d.ts +21 -0
- package/out/policy/defaults.d.ts.map +1 -0
- package/out/policy/defaults.js +27 -0
- package/out/policy/defaults.js.map +1 -0
- package/out/policy/index.d.ts +9 -0
- package/out/policy/index.d.ts.map +1 -0
- package/out/policy/index.js +9 -0
- package/out/policy/index.js.map +1 -0
- package/out/policy/policy.d.ts +57 -0
- package/out/policy/policy.d.ts.map +1 -0
- package/out/policy/policy.js +12 -0
- package/out/policy/policy.js.map +1 -0
- package/out/policy/registry.d.ts +31 -0
- package/out/policy/registry.d.ts.map +1 -0
- package/out/policy/registry.js +114 -0
- package/out/policy/registry.js.map +1 -0
- package/out/resources/LocaleIndex.d.ts +54 -0
- package/out/resources/LocaleIndex.d.ts.map +1 -0
- package/out/resources/LocaleIndex.js +91 -0
- package/out/resources/LocaleIndex.js.map +1 -0
- package/out/resources/ResourceMapCache.d.ts +40 -0
- package/out/resources/ResourceMapCache.d.ts.map +1 -0
- package/out/resources/ResourceMapCache.js +75 -0
- package/out/resources/ResourceMapCache.js.map +1 -0
- package/out/resources/collections.d.ts +28 -0
- package/out/resources/collections.d.ts.map +1 -0
- package/out/resources/collections.js +76 -0
- package/out/resources/collections.js.map +1 -0
- package/out/resources/db/index.d.ts +57 -0
- package/out/resources/db/index.d.ts.map +1 -0
- package/out/resources/db/index.js +57 -0
- package/out/resources/db/index.js.map +1 -0
- package/out/resources/debugging.d.ts +16 -0
- package/out/resources/debugging.d.ts.map +1 -0
- package/out/resources/debugging.js +12 -0
- package/out/resources/debugging.js.map +1 -0
- package/out/resources/fs.d.ts +12 -0
- package/out/resources/fs.d.ts.map +1 -0
- package/out/resources/fs.js +13 -0
- package/out/resources/fs.js.map +1 -0
- package/out/resources/git.d.ts +24 -0
- package/out/resources/git.d.ts.map +1 -0
- package/out/resources/git.js +36 -0
- package/out/resources/git.js.map +1 -0
- package/out/resources/index.d.ts +19 -0
- package/out/resources/index.d.ts.map +1 -0
- package/out/resources/index.js +19 -0
- package/out/resources/index.js.map +1 -0
- package/out/resources/languages/index.d.ts +24 -0
- package/out/resources/languages/index.d.ts.map +1 -0
- package/out/resources/languages/index.js +43 -0
- package/out/resources/languages/index.js.map +1 -0
- package/out/resources/languages/types.gen.d.ts +259 -0
- package/out/resources/languages/types.gen.d.ts.map +1 -0
- package/out/resources/languages/types.gen.js +983 -0
- package/out/resources/languages/types.gen.js.map +1 -0
- package/out/resources/libaddressinput.d.ts +103 -0
- package/out/resources/libaddressinput.d.ts.map +1 -0
- package/out/resources/libaddressinput.js +30 -0
- package/out/resources/libaddressinput.js.map +1 -0
- package/out/resources/libpostal.d.ts +31 -0
- package/out/resources/libpostal.d.ts.map +1 -0
- package/out/resources/libpostal.js +117 -0
- package/out/resources/libpostal.js.map +1 -0
- package/out/resources/locale.d.ts +14 -0
- package/out/resources/locale.d.ts.map +1 -0
- package/out/resources/locale.js +22 -0
- package/out/resources/locale.js.map +1 -0
- package/out/resources/set.d.ts +62 -0
- package/out/resources/set.d.ts.map +1 -0
- package/out/resources/set.js +149 -0
- package/out/resources/set.js.map +1 -0
- package/out/resources/whosonfirst/DataSourceCache.d.ts +18 -0
- package/out/resources/whosonfirst/DataSourceCache.d.ts.map +1 -0
- package/out/resources/whosonfirst/DataSourceCache.js +53 -0
- package/out/resources/whosonfirst/DataSourceCache.js.map +1 -0
- package/out/resources/whosonfirst/PlacetypeDataSource.d.ts +74 -0
- package/out/resources/whosonfirst/PlacetypeDataSource.d.ts.map +1 -0
- package/out/resources/whosonfirst/PlacetypeDataSource.js +111 -0
- package/out/resources/whosonfirst/PlacetypeDataSource.js.map +1 -0
- package/out/resources/whosonfirst/index.d.ts +10 -0
- package/out/resources/whosonfirst/index.d.ts.map +1 -0
- package/out/resources/whosonfirst/index.js +10 -0
- package/out/resources/whosonfirst/index.js.map +1 -0
- package/out/resources/whosonfirst/loader.d.ts +56 -0
- package/out/resources/whosonfirst/loader.d.ts.map +1 -0
- package/out/resources/whosonfirst/loader.js +115 -0
- package/out/resources/whosonfirst/loader.js.map +1 -0
- package/out/resources/whosonfirst/placetypes/Placetype.d.ts +128 -0
- package/out/resources/whosonfirst/placetypes/Placetype.d.ts.map +1 -0
- package/out/resources/whosonfirst/placetypes/Placetype.js +338 -0
- package/out/resources/whosonfirst/placetypes/Placetype.js.map +1 -0
- package/out/resources/whosonfirst/placetypes/admin.d.ts +48 -0
- package/out/resources/whosonfirst/placetypes/admin.d.ts.map +1 -0
- package/out/resources/whosonfirst/placetypes/admin.js +61 -0
- package/out/resources/whosonfirst/placetypes/admin.js.map +1 -0
- package/out/resources/whosonfirst/placetypes/definition.d.ts +73 -0
- package/out/resources/whosonfirst/placetypes/definition.d.ts.map +1 -0
- package/out/resources/whosonfirst/placetypes/definition.js +26 -0
- package/out/resources/whosonfirst/placetypes/definition.js.map +1 -0
- package/out/resources/whosonfirst/placetypes/index.d.ts +10 -0
- package/out/resources/whosonfirst/placetypes/index.d.ts.map +1 -0
- package/out/resources/whosonfirst/placetypes/index.js +10 -0
- package/out/resources/whosonfirst/placetypes/index.js.map +1 -0
- package/out/resources/whosonfirst/placetypes/mermaid.d.ts +20 -0
- package/out/resources/whosonfirst/placetypes/mermaid.d.ts.map +1 -0
- package/out/resources/whosonfirst/placetypes/mermaid.js +44 -0
- package/out/resources/whosonfirst/placetypes/mermaid.js.map +1 -0
- package/out/solver/BaseSolver.d.ts +24 -0
- package/out/solver/BaseSolver.d.ts.map +1 -0
- package/out/solver/BaseSolver.js +7 -0
- package/out/solver/BaseSolver.js.map +1 -0
- package/out/solver/HashMapSolver.d.ts +15 -0
- package/out/solver/HashMapSolver.d.ts.map +1 -0
- package/out/solver/HashMapSolver.js +61 -0
- package/out/solver/HashMapSolver.js.map +1 -0
- package/out/solver/Solution.d.ts +69 -0
- package/out/solver/Solution.d.ts.map +1 -0
- package/out/solver/Solution.js +137 -0
- package/out/solver/Solution.js.map +1 -0
- package/out/solver/SolutionMatch.d.ts +69 -0
- package/out/solver/SolutionMatch.d.ts.map +1 -0
- package/out/solver/SolutionMatch.js +101 -0
- package/out/solver/SolutionMatch.js.map +1 -0
- package/out/solver/index.d.ts +11 -0
- package/out/solver/index.d.ts.map +1 -0
- package/out/solver/index.js +11 -0
- package/out/solver/index.js.map +1 -0
- package/out/solver/mask.d.ts +27 -0
- package/out/solver/mask.d.ts.map +1 -0
- package/out/solver/mask.js +52 -0
- package/out/solver/mask.js.map +1 -0
- package/out/solvers/ExclusiveCartesianSolver.d.ts +12 -0
- package/out/solvers/ExclusiveCartesianSolver.d.ts.map +1 -0
- package/out/solvers/ExclusiveCartesianSolver.js +58 -0
- package/out/solvers/ExclusiveCartesianSolver.js.map +1 -0
- package/out/solvers/HouseNumberPositionPenalty.d.ts +10 -0
- package/out/solvers/HouseNumberPositionPenalty.d.ts.map +1 -0
- package/out/solvers/HouseNumberPositionPenalty.js +63 -0
- package/out/solvers/HouseNumberPositionPenalty.js.map +1 -0
- package/out/solvers/LeadingAreaDeclassifier.d.ts +13 -0
- package/out/solvers/LeadingAreaDeclassifier.d.ts.map +1 -0
- package/out/solvers/LeadingAreaDeclassifier.js +35 -0
- package/out/solvers/LeadingAreaDeclassifier.js.map +1 -0
- package/out/solvers/MultiStreetSolver.d.ts +32 -0
- package/out/solvers/MultiStreetSolver.d.ts.map +1 -0
- package/out/solvers/MultiStreetSolver.js +110 -0
- package/out/solvers/MultiStreetSolver.js.map +1 -0
- package/out/solvers/OrphanedLevelTypeDeclassifier.d.ts +10 -0
- package/out/solvers/OrphanedLevelTypeDeclassifier.d.ts.map +1 -0
- package/out/solvers/OrphanedLevelTypeDeclassifier.js +21 -0
- package/out/solvers/OrphanedLevelTypeDeclassifier.js.map +1 -0
- package/out/solvers/OrphanedUnitTypeDeclassifier.d.ts +10 -0
- package/out/solvers/OrphanedUnitTypeDeclassifier.d.ts.map +1 -0
- package/out/solvers/OrphanedUnitTypeDeclassifier.js +21 -0
- package/out/solvers/OrphanedUnitTypeDeclassifier.js.map +1 -0
- package/out/solvers/PostcodePositionPenalty.d.ts +16 -0
- package/out/solvers/PostcodePositionPenalty.d.ts.map +1 -0
- package/out/solvers/PostcodePositionPenalty.js +33 -0
- package/out/solvers/PostcodePositionPenalty.js.map +1 -0
- package/out/solvers/VenueCaptureSolver.d.ts +13 -0
- package/out/solvers/VenueCaptureSolver.d.ts.map +1 -0
- package/out/solvers/VenueCaptureSolver.js +22 -0
- package/out/solvers/VenueCaptureSolver.js.map +1 -0
- package/out/solvers/index.d.ts +14 -0
- package/out/solvers/index.d.ts.map +1 -0
- package/out/solvers/index.js +14 -0
- package/out/solvers/index.js.map +1 -0
- package/out/tokenization/Graph.d.ts +35 -0
- package/out/tokenization/Graph.d.ts.map +1 -0
- package/out/tokenization/Graph.js +38 -0
- package/out/tokenization/Graph.js.map +1 -0
- package/out/tokenization/Span.d.ts +115 -0
- package/out/tokenization/Span.d.ts.map +1 -0
- package/out/tokenization/Span.js +223 -0
- package/out/tokenization/Span.js.map +1 -0
- package/out/tokenization/context.d.ts +39 -0
- package/out/tokenization/context.d.ts.map +1 -0
- package/out/tokenization/context.js +114 -0
- package/out/tokenization/context.js.map +1 -0
- package/out/tokenization/index.d.ts +11 -0
- package/out/tokenization/index.d.ts.map +1 -0
- package/out/tokenization/index.js +11 -0
- package/out/tokenization/index.js.map +1 -0
- package/out/tokenization/normalizer.d.ts +41 -0
- package/out/tokenization/normalizer.d.ts.map +1 -0
- package/out/tokenization/normalizer.js +94 -0
- package/out/tokenization/normalizer.js.map +1 -0
- package/out/tokenization/permutate.d.ts +29 -0
- package/out/tokenization/permutate.d.ts.map +1 -0
- package/out/tokenization/permutate.js +73 -0
- package/out/tokenization/permutate.js.map +1 -0
- package/out/tokenization/split.d.ts +22 -0
- package/out/tokenization/split.d.ts.map +1 -0
- package/out/tokenization/split.js +63 -0
- package/out/tokenization/split.js.map +1 -0
- package/out/types/classifier.d.ts +117 -0
- package/out/types/classifier.d.ts.map +1 -0
- package/out/types/classifier.js +19 -0
- package/out/types/classifier.js.map +1 -0
- package/out/types/component.d.ts +42 -0
- package/out/types/component.d.ts.map +1 -0
- package/out/types/component.js +69 -0
- package/out/types/component.js.map +1 -0
- package/out/types/index.d.ts +9 -0
- package/out/types/index.d.ts.map +1 -0
- package/out/types/index.js +9 -0
- package/out/types/index.js.map +1 -0
- package/out/types/mapping.d.ts +38 -0
- package/out/types/mapping.d.ts.map +1 -0
- package/out/types/mapping.js +71 -0
- package/out/types/mapping.js.map +1 -0
- package/out/utils/index.d.ts +7 -0
- package/out/utils/index.d.ts.map +1 -0
- package/out/utils/index.js +7 -0
- package/out/utils/index.js.map +1 -0
- package/out/utils/repo.d.ts +42 -0
- package/out/utils/repo.d.ts.map +1 -0
- package/out/utils/repo.js +72 -0
- package/out/utils/repo.js.map +1 -0
- package/out/vitest.config.d.ts +15 -0
- package/out/vitest.config.d.ts.map +1 -0
- package/out/vitest.config.js +45 -0
- package/out/vitest.config.js.map +1 -0
- package/package.json +45 -0
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"index.js","sourceRoot":"","sources":["../../tokenization/index.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAEH,cAAc,cAAc,CAAA;AAC5B,cAAc,YAAY,CAAA;AAC1B,cAAc,iBAAiB,CAAA;AAC/B,cAAc,gBAAgB,CAAA;AAC9B,cAAc,WAAW,CAAA"}
|
|
@@ -0,0 +1,41 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* @copyright Sister Software
|
|
3
|
+
* @license AGPL-3.0
|
|
4
|
+
* @author Teffen Ellis, et al.
|
|
5
|
+
*/
|
|
6
|
+
export interface TextNormalizerReplaceClause {
|
|
7
|
+
from: string | RegExp;
|
|
8
|
+
to: string;
|
|
9
|
+
}
|
|
10
|
+
export interface TextNormalizerInit {
|
|
11
|
+
lowercase?: boolean;
|
|
12
|
+
removeAccents?: boolean;
|
|
13
|
+
removeHyphen?: boolean;
|
|
14
|
+
removeSpaces?: boolean;
|
|
15
|
+
minLength?: number;
|
|
16
|
+
maxLength?: number;
|
|
17
|
+
replace?: TextNormalizerReplaceClause[];
|
|
18
|
+
}
|
|
19
|
+
/**
|
|
20
|
+
* Normalizes text values, i.e. removes superfluous characters such as accents, hyphens, and spaces.
|
|
21
|
+
*/
|
|
22
|
+
export declare class TextNormalizer implements TextNormalizerInit {
|
|
23
|
+
readonly lowercase: boolean;
|
|
24
|
+
readonly removeAccents: boolean;
|
|
25
|
+
readonly removeHyphen: boolean;
|
|
26
|
+
readonly removeSpaces: boolean;
|
|
27
|
+
readonly replace: TextNormalizerReplaceClause[];
|
|
28
|
+
readonly minLength?: number;
|
|
29
|
+
readonly maxLength?: number;
|
|
30
|
+
constructor(init?: TextNormalizerInit);
|
|
31
|
+
/**
|
|
32
|
+
* Perform text normalization on a given input.
|
|
33
|
+
*/
|
|
34
|
+
normalize(input: string): string;
|
|
35
|
+
/**
|
|
36
|
+
* Validate a given input against the defined validations.
|
|
37
|
+
*/
|
|
38
|
+
validate(input: string): boolean;
|
|
39
|
+
toJSON(): TextNormalizerInit;
|
|
40
|
+
}
|
|
41
|
+
//# sourceMappingURL=normalizer.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"normalizer.d.ts","sourceRoot":"","sources":["../../tokenization/normalizer.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAoBH,MAAM,WAAW,2BAA2B;IAC3C,IAAI,EAAE,MAAM,GAAG,MAAM,CAAA;IACrB,EAAE,EAAE,MAAM,CAAA;CACV;AAED,MAAM,WAAW,kBAAkB;IAClC,SAAS,CAAC,EAAE,OAAO,CAAA;IACnB,aAAa,CAAC,EAAE,OAAO,CAAA;IACvB,YAAY,CAAC,EAAE,OAAO,CAAA;IACtB,YAAY,CAAC,EAAE,OAAO,CAAA;IACtB,SAAS,CAAC,EAAE,MAAM,CAAA;IAClB,SAAS,CAAC,EAAE,MAAM,CAAA;IAClB,OAAO,CAAC,EAAE,2BAA2B,EAAE,CAAA;CACvC;AAED;;GAEG;AACH,qBAAa,cAAe,YAAW,kBAAkB;IACxD,SAAgB,SAAS,EAAE,OAAO,CAAA;IAClC,SAAgB,aAAa,EAAE,OAAO,CAAA;IACtC,SAAgB,YAAY,EAAE,OAAO,CAAA;IACrC,SAAgB,YAAY,EAAE,OAAO,CAAA;IACrC,SAAgB,OAAO,EAAE,2BAA2B,EAAE,CAAA;IACtD,SAAgB,SAAS,CAAC,EAAE,MAAM,CAAA;IAClC,SAAgB,SAAS,CAAC,EAAE,MAAM,CAAA;gBAEtB,IAAI,GAAE,kBAAuB;IAUzC;;OAEG;IACI,SAAS,CAAC,KAAK,EAAE,MAAM,GAAG,MAAM;IAgCvC;;OAEG;IACI,QAAQ,CAAC,KAAK,EAAE,MAAM,GAAG,OAAO;IAYhC,MAAM,IAAI,kBAAkB;CAWnC"}
|
|
@@ -0,0 +1,94 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* @copyright Sister Software
|
|
3
|
+
* @license AGPL-3.0
|
|
4
|
+
* @author Teffen Ellis, et al.
|
|
5
|
+
*/
|
|
6
|
+
import regenerate from "regenerate";
|
|
7
|
+
/**
 * Global regular expression matching the code points that are stripped when
 * accents are removed: combining diacritical marks (all listed blocks),
 * variation selectors, combining half marks, the zero width joiner and the
 * combining (han)dakuten marks.
 */
const CombiningDiacriticalPattern = [
    [0x0300, 0x036f], // Combining Diacritical Marks
    [0x1ab0, 0x1aff], // Combining Diacritical Marks Extended
    [0x1dc0, 0x1dff], // Combining Diacritical Marks Supplement
    [0x20d0, 0x20ff], // Combining Diacritical Marks for Symbols
    [0xfe00, 0xfe0f], // Variation Selectors
    [0xfe20, 0xfe2f], // Combining Half Marks
]
    .reduce(
        // Fold every contiguous range into the set that already holds the single code points.
        (codePoints, [first, last]) => codePoints.addRange(first, last),
        regenerate()
            .add(0x200d) // ZERO WIDTH JOINER (U+200D)
            .add(0x3099) // Combining Dakuten
            .add(0x309a), // Combining Handakuten
    )
    .toRegExp("g");
|
|
22
|
+
/**
 * Normalizes text values, i.e. removes superfluous characters such as accents, hyphens, and spaces,
 * and validates inputs against optional length bounds.
 *
 * All options are fixed at construction time; boolean options default to `false`,
 * `replace` defaults to an empty list, and the length bounds default to `undefined` (no bound).
 */
export class TextNormalizer {
    lowercase;
    removeAccents;
    removeHyphen;
    removeSpaces;
    replace;
    minLength;
    maxLength;
    /**
     * @param {object} [init] - Normalizer options; every property is optional.
     */
    constructor(init = {}) {
        this.lowercase = init.lowercase ?? false;
        this.removeAccents = init.removeAccents ?? false;
        this.removeHyphen = init.removeHyphen ?? false;
        this.removeSpaces = init.removeSpaces ?? false;
        this.replace = init.replace ?? [];
        this.minLength = init.minLength;
        this.maxLength = init.maxLength;
    }
    /**
     * Perform text normalization on a given input.
     *
     * Steps run in a fixed order: trim, custom replacements, lowercasing,
     * accent removal, hyphen replacement, space removal.
     *
     * @param {string} input - The text to normalize.
     * @returns {string} The normalized text.
     */
    normalize(input) {
        input = input.trim();
        // Note: a string `from` only replaces its first occurrence (String.prototype.replace
        // semantics); pass a RegExp with the `g` flag to replace every occurrence.
        for (const { from, to } of this.replace) {
            input = input.replace(from, to);
        }
        if (this.lowercase) {
            input = input.toLowerCase();
        }
        if (this.removeAccents) {
            input = input
                // We first normalize to NFKD to decompose any accented characters...
                .normalize("NFKD")
                // Then we remove the combining marks left behind by the decomposition...
                .replace(CombiningDiacriticalPattern, "")
                // And finally we normalize to NFKC to recompose the string.
                .normalize("NFKC");
        }
        if (this.removeHyphen) {
            // Hyphens become spaces (not removed) so the joined words stay separate.
            input = input.replace(/-/g, " ");
        }
        if (this.removeSpaces) {
            input = input.replace(/ /g, "");
        }
        return input;
    }
    /**
     * Validate a given input against the defined validations.
     *
     * A bound is applied whenever it is set (not `undefined`/`null`), including `0`;
     * a truthiness check would silently ignore `maxLength: 0`.
     *
     * @param {string} input - The text to validate.
     * @returns {boolean} `false` when the input length falls outside the bounds, otherwise `true`.
     */
    validate(input) {
        const hasMinLength = this.minLength !== undefined && this.minLength !== null;
        if (hasMinLength && input.length < this.minLength) {
            return false;
        }
        const hasMaxLength = this.maxLength !== undefined && this.maxLength !== null;
        if (hasMaxLength && input.length > this.maxLength) {
            return false;
        }
        return true;
    }
    /**
     * Produce a plain-object snapshot of the options this normalizer was built with.
     *
     * @returns {object} An object carrying the same option properties accepted by the constructor.
     */
    toJSON() {
        return {
            lowercase: this.lowercase,
            removeAccents: this.removeAccents,
            removeHyphen: this.removeHyphen,
            removeSpaces: this.removeSpaces,
            replace: this.replace,
            minLength: this.minLength,
            maxLength: this.maxLength,
        };
    }
}
|
|
94
|
+
//# sourceMappingURL=normalizer.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"normalizer.js","sourceRoot":"","sources":["../../tokenization/normalizer.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAEH,OAAO,UAAU,MAAM,YAAY,CAAA;AAEnC;;;GAGG;AACH,MAAM,2BAA2B,GAAG,UAAU,EAAE;KAC9C,GAAG,CAAC,MAAM,CAAC,CAAC,6BAA6B;KACzC,QAAQ,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC,8BAA8B;KACvD,QAAQ,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC,uCAAuC;KAChE,QAAQ,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC,yCAAyC;KAClE,QAAQ,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC,0CAA0C;KACnE,QAAQ,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC,sBAAsB;KAC/C,QAAQ,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC,uBAAuB;KAChD,GAAG,CAAC,MAAM,CAAC,CAAC,oBAAoB;KAChC,GAAG,CAAC,MAAM,CAAC,CAAC,uBAAuB;KACnC,QAAQ,CAAC,GAAG,CAAC,CAAA;AAiBf;;GAEG;AACH,MAAM,OAAO,cAAc;IACV,SAAS,CAAS;IAClB,aAAa,CAAS;IACtB,YAAY,CAAS;IACrB,YAAY,CAAS;IACrB,OAAO,CAA+B;IACtC,SAAS,CAAS;IAClB,SAAS,CAAS;IAElC,YAAY,OAA2B,EAAE;QACxC,IAAI,CAAC,SAAS,GAAG,IAAI,CAAC,SAAS,IAAI,KAAK,CAAA;QACxC,IAAI,CAAC,aAAa,GAAG,IAAI,CAAC,aAAa,IAAI,KAAK,CAAA;QAChD,IAAI,CAAC,YAAY,GAAG,IAAI,CAAC,YAAY,IAAI,KAAK,CAAA;QAC9C,IAAI,CAAC,YAAY,GAAG,IAAI,CAAC,YAAY,IAAI,KAAK,CAAA;QAC9C,IAAI,CAAC,OAAO,GAAG,IAAI,CAAC,OAAO,IAAI,EAAE,CAAA;QACjC,IAAI,CAAC,SAAS,GAAG,IAAI,CAAC,SAAS,CAAA;QAC/B,IAAI,CAAC,SAAS,GAAG,IAAI,CAAC,SAAS,CAAA;IAChC,CAAC;IAED;;OAEG;IACI,SAAS,CAAC,KAAa;QAC7B,KAAK,GAAG,KAAK,CAAC,IAAI,EAAE,CAAA;QAEpB,KAAK,MAAM,EAAE,IAAI,EAAE,EAAE,EAAE,IAAI,IAAI,CAAC,OAAO,EAAE,CAAC;YACzC,KAAK,GAAG,KAAK,CAAC,OAAO,CAAC,IAAI,EAAE,EAAE,CAAC,CAAA;QAChC,CAAC;QAED,IAAI,IAAI,CAAC,SAAS,EAAE,CAAC;YACpB,KAAK,GAAG,KAAK,CAAC,WAAW,EAAE,CAAA;QAC5B,CAAC;QAED,IAAI,IAAI,CAAC,aAAa,EAAE,CAAC;YACxB,KAAK,GAAG,KAAK;gBACZ,qEAAqE;iBACpE,SAAS,CAAC,MAAM,CAAC;gBAClB,4CAA4C;iBAC3C,OAAO,CAAC,2BAA2B,EAAE,EAAE,CAAC;gBACzC,4DAA4D;iBAC3D,SAAS,CAAC,MAAM,CAAC,CAAA;QACpB,CAAC;QAED,IAAI,IAAI,CAAC,YAAY,EAAE,CAAC;YACvB,KAAK,GAAG,KAAK,CAAC,OAAO,CAAC,IAAI,EAAE,GAAG,CAAC,CAAA;QACjC,CAAC;QAED,IAAI,IAAI,CAAC,YAAY,EAAE,CAAC;YACvB,KAAK,GAAG,KAAK,CAAC,OAAO,CAAC,IAAI,EAAE,EAAE,CAAC,CAAA;QAChC,CAAC;QAED,OAAO,KAAK,CAAA;IACb,CAAC;IAED;;OAEG;IACI,QAAQ,CAAC,KAAa;QAC5B,IAAI,IAAI,CAAC,SAAS
,IAAI,KAAK,CAAC,MAAM,GAAG,IAAI,CAAC,SAAS,EAAE,CAAC;YACrD,OAAO,KAAK,CAAA;QACb,CAAC;QAED,IAAI,IAAI,CAAC,SAAS,IAAI,KAAK,CAAC,MAAM,GAAG,IAAI,CAAC,SAAS,EAAE,CAAC;YACrD,OAAO,KAAK,CAAA;QACb,CAAC;QAED,OAAO,IAAI,CAAA;IACZ,CAAC;IAEM,MAAM;QACZ,OAAO;YACN,SAAS,EAAE,IAAI,CAAC,SAAS;YACzB,aAAa,EAAE,IAAI,CAAC,aAAa;YACjC,YAAY,EAAE,IAAI,CAAC,YAAY;YAC/B,YAAY,EAAE,IAAI,CAAC,YAAY;YAC/B,OAAO,EAAE,IAAI,CAAC,OAAO;YACrB,SAAS,EAAE,IAAI,CAAC,SAAS;YACzB,SAAS,EAAE,IAAI,CAAC,SAAS;SACzB,CAAA;IACF,CAAC;CACD"}
|
|
@@ -0,0 +1,29 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* @copyright Sister Software
|
|
3
|
+
* @license AGPL-3.0
|
|
4
|
+
* @author Teffen Ellis, et al.
|
|
5
|
+
*/
|
|
6
|
+
import { Span } from "./Span.js";
|
|
7
|
+
/**
 * Window limits accepted by `permutate`.
 */
export interface PermutateOptions {
    /** Smallest number of tokens a single window may contain. */
    from: number;

    /** Largest number of tokens a single window may contain. */
    to: number;
}
|
|
17
|
+
/**
 * Build every group of adjacent input tokens, keeping the tokens in their original order.
 *
 * Example: for the tokens `['soho', 'new', 'york', 'usa']` the groups are
 *
 *     ['soho', 'new', 'york', 'usa'], ['soho', 'new', 'york'], ['soho', 'new'], ['soho'],
 *     ['new', 'york', 'usa'], ['new', 'york'], ['new'],
 *     ['york', 'usa'], ['york'],
 *     ['usa']
 *
 * The second argument bounds how many tokens a group may contain (see `PermutateOptions`).
 *
 * @param spans - The spans to permutate
 *
 * @returns The permutations
 */
export declare function permutate(spans: Iterable<Span>, { from, to }: PermutateOptions): Span[];
|
|
29
|
+
//# sourceMappingURL=permutate.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"permutate.d.ts","sourceRoot":"","sources":["../../tokenization/permutate.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAEH,OAAO,EAAE,IAAI,EAAE,MAAM,WAAW,CAAA;AAiEhC,MAAM,WAAW,gBAAgB;IAChC;;OAEG;IACH,IAAI,EAAE,MAAM,CAAA;IAEZ;;OAEG;IACH,EAAE,EAAE,MAAM,CAAA;CACV;AAED;;;;;;;;;;GAUG;AACH,wBAAgB,SAAS,CAAC,KAAK,EAAE,QAAQ,CAAC,IAAI,CAAC,EAAE,EAAE,IAAI,EAAE,EAAE,EAAE,EAAE,gBAAgB,GAAG,IAAI,EAAE,CAQvF"}
|
|
@@ -0,0 +1,73 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* @copyright Sister Software
|
|
3
|
+
* @license AGPL-3.0
|
|
4
|
+
* @author Teffen Ellis, et al.
|
|
5
|
+
*/
|
|
6
|
+
import { Span } from "./Span.js";
|
|
7
|
+
/** Separator placed between the bodies of two joined spans. */
const JOIN_CHAR = " ";

/**
 * Recursive worker behind `permutate`: extends `prevSpan` with `currentSpan`, then tries to extend
 * the result with every sibling that follows `currentSpan`.
 *
 * Ported from https://github.com/pelias/placeholder/blob/master/lib/permutations.js
 *
 * Note: we should honor word boundary delimiters (such as comma) when creating permutations.
 *
 * @param prevSpan - Span accumulated so far (an empty span on the first call)
 * @param currentSpan - Token span appended at this step
 * @param windowCur - Number of tokens in the span built at this step
 * @param windowMin - Minimum number of tokens a span needs in order to be collected
 * @param windowMax - Maximum number of tokens a span may contain
 * @param permutations - Output array; collected spans are pushed onto it
 */
function permutateRec(prevSpan, currentSpan, windowCur, windowMin, windowMax, permutations) {
    // The window has grown past its upper bound: nothing to build on this path.
    if (windowCur > windowMax) {
        return;
    }

    // Join the bodies; the separator is only needed when there is something before it.
    const prefix = prevSpan.body.length > 0 ? prevSpan.body + JOIN_CHAR : prevSpan.body;
    const joined = new Span(prefix + currentSpan.body, prevSpan.start);

    // Every token that makes up the joined span becomes its child, and gains it as a parent.
    const link = (member) => {
        joined.children.add(member);
        member.parents.add(joined);
    };
    prevSpan.children.forEach(link);
    link(currentSpan);

    const startsHere = joined.body === currentSpan.body;
    const hasNext = Boolean(currentSpan.nextSibling);

    if (startsHere) {
        // Single-token span: take the token's own bounds.
        joined.start = currentSpan.start;
        joined.end = currentSpan.end;
    } else {
        // Otherwise widen the bounds so they cover the appended token.
        if (joined.start > currentSpan.start) {
            joined.start = currentSpan.start;
        }
        if (joined.end < currentSpan.end) {
            joined.end = currentSpan.end;
        }
    }

    // Walk the sibling graph first, so longer groups are collected before shorter ones.
    if (hasNext) {
        currentSpan.nextSiblings.forEach((following) => {
            permutateRec(joined, following, windowCur + 1, windowMin, windowMax, permutations);
        });
    }

    if (windowCur >= windowMin) {
        permutations.push(joined);
    }
}
|
|
55
|
+
/**
 * Build every group of adjacent input tokens, keeping the tokens in their original order.
 *
 * Example: for the tokens `['soho', 'new', 'york', 'usa']` the groups are
 *
 *     ['soho', 'new', 'york', 'usa'], ['soho', 'new', 'york'], ['soho', 'new'], ['soho'],
 *     ['new', 'york', 'usa'], ['new', 'york'], ['new'],
 *     ['york', 'usa'], ['york'],
 *     ['usa']
 *
 * `from` and `to` are forwarded to `permutateRec` as the minimum and maximum window size.
 *
 * @param spans - The spans to permutate
 *
 * @returns The permutations
 */
export function permutate(spans, { from, to }) {
    const collected = [];
    const firstWindow = 1;

    for (const head of spans) {
        // Each token starts its own chain, seeded with a fresh empty span.
        permutateRec(new Span(), head, firstWindow, from, to, collected);
    }

    return collected;
}
|
|
73
|
+
//# sourceMappingURL=permutate.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"permutate.js","sourceRoot":"","sources":["../../tokenization/permutate.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAEH,OAAO,EAAE,IAAI,EAAE,MAAM,WAAW,CAAA;AAEhC,MAAM,SAAS,GAAG,GAAG,CAAA;AAErB;;;;;;;;GAQG;AACH,SAAS,YAAY,CACpB,QAAc,EACd,WAAiB,EACjB,SAAiB,EACjB,SAAiB,EACjB,SAAiB,EACjB,YAAoB;IAEpB,mCAAmC;IACnC,IAAI,SAAS,GAAG,SAAS;QAAE,OAAM;IAEjC,wDAAwD;IACxD,MAAM,IAAI,GAAG,IAAI,IAAI,CAAC,QAAQ,CAAC,IAAI,GAAG,CAAC,QAAQ,CAAC,IAAI,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC,CAAC,SAAS,CAAC,CAAC,CAAC,EAAE,CAAC,GAAG,WAAW,CAAC,IAAI,EAAE,QAAQ,CAAC,KAAK,CAAC,CAAA;IAErH,sGAAsG;IACtG,mFAAmF;IACnF,QAAQ,CAAC,QAAQ,CAAC,OAAO,CAAC,CAAC,KAAK,EAAE,EAAE;QACnC,IAAI,CAAC,QAAQ,CAAC,GAAG,CAAC,KAAK,CAAC,CAAA;QACxB,KAAK,CAAC,OAAO,CAAC,GAAG,CAAC,IAAI,CAAC,CAAA;IACxB,CAAC,CAAC,CAAA;IAEF,IAAI,CAAC,QAAQ,CAAC,GAAG,CAAC,WAAW,CAAC,CAAA;IAC9B,WAAW,CAAC,OAAO,CAAC,GAAG,CAAC,IAAI,CAAC,CAAA;IAE7B,MAAM,OAAO,GAAG,IAAI,CAAC,IAAI,KAAK,WAAW,CAAC,IAAI,CAAA;IAC9C,MAAM,MAAM,GAAG,CAAC,WAAW,CAAC,WAAW,CAAA;IAEvC,IAAI,OAAO,EAAE,CAAC;QACb,IAAI,CAAC,KAAK,GAAG,WAAW,CAAC,KAAK,CAAA;QAC9B,IAAI,CAAC,GAAG,GAAG,WAAW,CAAC,GAAG,CAAA;IAC3B,CAAC;SAAM,CAAC;QACP,IAAI,WAAW,CAAC,KAAK,GAAG,IAAI,CAAC,KAAK,EAAE,CAAC;YACpC,IAAI,CAAC,KAAK,GAAG,WAAW,CAAC,KAAK,CAAA;QAC/B,CAAC;QAED,IAAI,WAAW,CAAC,GAAG,GAAG,IAAI,CAAC,GAAG,EAAE,CAAC;YAChC,IAAI,CAAC,GAAG,GAAG,WAAW,CAAC,GAAG,CAAA;QAC3B,CAAC;IACF,CAAC;IAED,yDAAyD;IACzD,IAAI,CAAC,MAAM,EAAE,CAAC;QACb,WAAW,CAAC,YAAY,CAAC,OAAO,CAAC,CAAC,IAAI,EAAE,EAAE;YACzC,YAAY,CAAC,IAAI,EAAE,IAAI,EAAE,SAAS,GAAG,CAAC,EAAE,SAAS,EAAE,SAAS,EAAE,YAAY,CAAC,CAAA;QAC5E,CAAC,CAAC,CAAA;IACH,CAAC;IAED,IAAI,SAAS,IAAI,SAAS,EAAE,CAAC;QAC5B,YAAY,CAAC,IAAI,CAAC,IAAI,CAAC,CAAA;IACxB,CAAC;AACF,CAAC;AAcD;;;;;;;;;;GAUG;AACH,MAAM,UAAU,SAAS,CAAC,KAAqB,EAAE,EAAE,IAAI,EAAE,EAAE,EAAoB;IAC9E,MAAM,YAAY,GAAW,EAAE,CAAA;IAE/B,KAAK,MAAM,IAAI,IAAI,KAAK,EAAE,CAAC;QAC1B,YAAY,CAAC,IAAI,IAAI,EAAE,EAAE,IAAI,EAAE,CAAC,EAAE,IAAI,EAAE,EAAE,EAAE,YAAY,CAAC,CAAA;IAC1D,CAAC;IAED,OAAO,YAAY,CAAA;AACpB,CAAC"}
|
|
@@ -0,0 +1,22 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* @copyright Sister Software
|
|
3
|
+
* @license AGPL-3.0
|
|
4
|
+
* @author Teffen Ellis, et al.
|
|
5
|
+
*/
|
|
6
|
+
import { Span } from "./Span.js";
|
|
7
|
+
/**
 * Test applied to one character of a span body; `true` marks the character as a separator.
 */
type FieldMatchPredicate = (char: string) => boolean;

/**
 * Split the body of `span` into the runs of characters that `predicate` does not match, and
 * return one `Span` per run.
 */
export declare function splitByField(span: Span, predicate: FieldMatchPredicate): Span[];

/**
 * Predicate to test if a character is a field boundary.
 */
export declare const fieldsFuncBoundary: FieldMatchPredicate;

/**
 * Predicate to test if a character is whitespace.
 */
export declare const fieldsFuncWhiteSpace: FieldMatchPredicate;

/**
 * Predicate to test if a character is a hyphen, a forward slash or whitespace.
 */
export declare const fieldsFuncHyphenOrWhiteSpace: FieldMatchPredicate;
|
|
21
|
+
export {};
|
|
22
|
+
//# sourceMappingURL=split.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"split.d.ts","sourceRoot":"","sources":["../../tokenization/split.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAEH,OAAO,EAAE,IAAI,EAAE,MAAM,WAAW,CAAA;AAEhC,KAAK,mBAAmB,GAAG,CAAC,IAAI,EAAE,MAAM,KAAK,OAAO,CAAA;AAEpD,wBAAgB,YAAY,CAAC,IAAI,EAAE,IAAI,EAAE,SAAS,EAAE,mBAAmB,GAAG,IAAI,EAAE,CA8C/E;AAKD;;GAEG;AACH,eAAO,MAAM,kBAAkB,EAAE,mBAGhC,CAAA;AAED;;GAEG;AACH,eAAO,MAAM,oBAAoB,EAAE,mBAElC,CAAA;AAED;;GAEG;AACH,eAAO,MAAM,4BAA4B,EAAE,mBAE1C,CAAA"}
|
|
@@ -0,0 +1,63 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* @copyright Sister Software
|
|
3
|
+
* @license AGPL-3.0
|
|
4
|
+
* @author Teffen Ellis, et al.
|
|
5
|
+
*/
|
|
6
|
+
import { Span } from "./Span.js";
|
|
7
|
+
/**
 * Return the span for `span.body[from:to]`: an existing child of `span` with the same start and
 * body when there is one, otherwise a new span created through `Span.from`.
 *
 * @param span - Span being split
 * @param from - Inclusive start index of the field inside `span.body`
 * @param to - Exclusive end index of the field inside `span.body`
 */
function resolveField(span, from, to) {
    // Computed once per field rather than once per inspected child.
    const text = span.body.substring(from, to);
    const start = span.start + from;

    // Plain iteration: no dependency on the ES2025 `Iterator` helper global.
    for (const child of span.children) {
        if (child.start === start && child.body === text) {
            return child;
        }
    }

    return Span.from(text, { start });
}

/**
 * Split the body of `span` into fields, i.e. the maximal runs of characters for which `predicate`
 * returns a falsy value. Characters matched by `predicate` act as separators and are dropped.
 *
 * Each field is recorded as a slice `body[start:end]` (start inclusive, end exclusive). A child of
 * `span` that already covers exactly that slice is reused instead of creating a duplicate. The
 * resulting spans are handed to `Span.connectSiblings` before being returned.
 *
 * @param span - Span whose body is split
 * @param predicate - Called with one character at a time; truthy means "separator"
 *
 * @returns The field spans in order of appearance (empty when the body holds no field)
 */
export function splitByField(span, predicate) {
    const fields = [];

    // Index at which the field currently being read started, or -1 when between fields.
    let fieldStart = -1;

    // Note: this walks UTF-16 code units (`charAt`), not Unicode code points.
    for (let i = 0; i < span.body.length; i++) {
        const isSeparator = predicate(span.body.charAt(i));

        if (isSeparator) {
            if (fieldStart !== -1) {
                fields.push(resolveField(span, fieldStart, i));
                fieldStart = -1;
            }
        } else if (fieldStart === -1) {
            fieldStart = i;
        }
    }

    // The last field may run to the end of the body.
    if (fieldStart !== -1) {
        fields.push(resolveField(span, fieldStart, span.body.length));
    }

    // Add siblings to graph
    Span.connectSiblings(...fields);

    return fields;
}
|
|
42
|
+
// Quotation marks that delimit fields.
//
// The last four entries are written as escapes on purpose: they are the fullwidth quotation mark
// (U+FF02), the fullwidth apostrophe (U+FF07) and the halfwidth corner brackets (U+FF62, U+FF63).
// These characters are easily folded to their ASCII / fullwidth look-alikes by tooling, which
// would both duplicate earlier entries and put a raw `'` inside this single-quoted literal.
// NOTE(review): the four code points are inferred from the duplicated tail of the literal and the
// literal's width in the source map; confirm against tokenization/split.ts.
const quotes = '"«»‘’‚‛“”„‟‹›⹂「」『』〝〞〟﹁﹂﹃﹄\uFF02\uFF07\uFF62\uFF63';

// Newline, tab and comma separate fields.
const fieldBoundaryPattern = /\n|\t|,/;

/**
 * Predicate to test if a character is a field boundary: a newline, a tab, a comma or one of the
 * quotation marks listed in `quotes`.
 *
 * @param char - Character to test
 *
 * @returns `true` when the character is a field boundary
 */
export const fieldsFuncBoundary = (char) => {
    // TODO: this should ideally only work for 'matching pairs' of quotes.
    return fieldBoundaryPattern.test(char) || quotes.includes(char);
};
|
|
51
|
+
/**
 * Predicate to test if a character is whitespace, i.e. nothing is left of it after `trim()`.
 *
 * @param char - Character to test
 *
 * @returns `true` when trimming the character yields the empty string
 */
export const fieldsFuncWhiteSpace = (char) => char.trim() === "";
|
|
57
|
+
/**
 * Predicate to test if a character is a hyphen (`-`), a forward slash (`/`) or whitespace.
 *
 * @param char - Character to test
 *
 * @returns `true` for `-` and `/`, otherwise whatever `fieldsFuncWhiteSpace` returns
 */
export const fieldsFuncHyphenOrWhiteSpace = (char) => {
    if (char === "-" || char === "/") {
        return true;
    }

    return fieldsFuncWhiteSpace(char);
};
|
|
63
|
+
//# sourceMappingURL=split.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"split.js","sourceRoot":"","sources":["../../tokenization/split.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAEH,OAAO,EAAE,IAAI,EAAE,MAAM,WAAW,CAAA;AAIhC,MAAM,UAAU,YAAY,CAAC,IAAU,EAAE,SAA8B;IACtE,kEAAkE;IAClE,+DAA+D;IAC/D,MAAM,KAAK,GAAW,EAAE,CAAA;IAExB,wCAAwC;IACxC,IAAI,QAAQ,GAAG,KAAK,CAAA;IACpB,IAAI,SAAS,GAAG,CAAC,CAAA;IAEjB,wCAAwC;IACxC,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,IAAI,CAAC,IAAI,CAAC,MAAM,EAAE,CAAC,EAAE,EAAE,CAAC;QAC3C,MAAM,IAAI,GAAG,IAAI,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC,CAAC,CAAA;QAEhC,IAAI,SAAS,CAAC,IAAI,CAAC,EAAE,CAAC;YACrB,IAAI,QAAQ,EAAE,CAAC;gBACd,IAAI,aAAa,GAAG,QAAQ,CAAC,IAAI,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC,IAAI,CAAC,CAAC,KAAK,EAAE,EAAE;oBAC/D,OAAO,KAAK,CAAC,KAAK,KAAK,IAAI,CAAC,KAAK,GAAG,SAAS,IAAI,KAAK,CAAC,IAAI,KAAK,IAAI,CAAC,IAAI,CAAC,SAAS,CAAC,SAAS,EAAE,CAAC,CAAC,CAAA;gBAClG,CAAC,CAAC,CAAA;gBAEF,aAAa,KAAK,IAAI,CAAC,IAAI,CAAC,IAAI,CAAC,IAAI,CAAC,SAAS,CAAC,SAAS,EAAE,CAAC,CAAC,EAAE;oBAC9D,KAAK,EAAE,IAAI,CAAC,KAAK,GAAG,SAAS;iBAC7B,CAAC,CAAA;gBAEF,KAAK,CAAC,IAAI,CAAC,aAAa,CAAC,CAAA;gBAEzB,QAAQ,GAAG,KAAK,CAAA;YACjB,CAAC;QACF,CAAC;aAAM,IAAI,CAAC,QAAQ,EAAE,CAAC;YACtB,SAAS,GAAG,CAAC,CAAA;YACb,QAAQ,GAAG,IAAI,CAAA;QAChB,CAAC;IACF,CAAC;IAED,+BAA+B;IAC/B,IAAI,QAAQ,EAAE,CAAC;QACd,KAAK,CAAC,IAAI,CACT,QAAQ,CAAC,IAAI,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC,IAAI,CAChC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,KAAK,KAAK,IAAI,CAAC,KAAK,GAAG,SAAS,IAAI,CAAC,CAAC,IAAI,KAAK,IAAI,CAAC,IAAI,CAAC,SAAS,CAAC,SAAS,EAAE,IAAI,CAAC,IAAI,CAAC,MAAM,CAAC,CACxG,IAAI,IAAI,CAAC,IAAI,CAAC,IAAI,CAAC,IAAI,CAAC,SAAS,CAAC,SAAS,EAAE,IAAI,CAAC,IAAI,CAAC,MAAM,CAAC,EAAE,EAAE,KAAK,EAAE,IAAI,CAAC,KAAK,GAAG,SAAS,EAAE,CAAC,CACnG,CAAA;IACF,CAAC;IAED,wBAAwB;IACxB,IAAI,CAAC,eAAe,CAAC,GAAG,KAAK,CAAC,CAAA;IAE9B,OAAO,KAAK,CAAA;AACb,CAAC;AAED,MAAM,MAAM,GAAG,+BAA+B,CAAA;AAC9C,MAAM,oBAAoB,GAAG,SAAS,CAAA;AAEtC;;GAEG;AACH,MAAM,CAAC,MAAM,kBAAkB,GAAwB,CAAC,IAAI,EAAE,EAAE;IAC/D,sEAAsE;IACtE,OAAO,oBAAoB,CAAC,IAAI,CAAC,IAAI,CAAC,IAAI,MAAM,CAAC,QAAQ,CAAC,IAAI,CAAC,CAAA;AAChE,CAAC,CAAA;AAED;;GAEG;AACH,MAAM,CAAC,MAAM,
oBAAoB,GAAwB,CAAC,IAAI,EAAE,EAAE;IACjE,OAAO,IAAI,CAAC,IAAI,EAAE,CAAC,MAAM,KAAK,CAAC,CAAA;AAChC,CAAC,CAAA;AAED;;GAEG;AACH,MAAM,CAAC,MAAM,4BAA4B,GAAwB,CAAC,IAAI,EAAE,EAAE;IACzE,OAAO,IAAI,KAAK,GAAG,IAAI,IAAI,KAAK,GAAG,IAAI,oBAAoB,CAAC,IAAI,CAAC,CAAA;AAClE,CAAC,CAAA"}
|
|
@@ -0,0 +1,117 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* @copyright Sister Software
|
|
3
|
+
* @license AGPL-3.0
|
|
4
|
+
* @author Teffen Ellis, et al.
|
|
5
|
+
*
|
|
6
|
+
* Classifier-side contracts for the neural integration (per #6).
|
|
7
|
+
*
|
|
8
|
+
* These interfaces are deliberately distinct from the existing `Classifier` shape in
|
|
9
|
+
* `../classification/BaseClassifier.ts`. The legacy shape is mutation-based —
|
|
10
|
+
* `classifyTokens(context): void` — and runs synchronously over the span graph. The shape
|
|
11
|
+
* declared here is pull-based and async: a classifier returns a list of `ClassificationProposal`
|
|
12
|
+
* objects keyed by the canonical `ComponentTag` union.
|
|
13
|
+
*
|
|
14
|
+
* Both shapes co-exist during the Ship-of-Theseus rollout. Rule classifiers are wrapped via
|
|
15
|
+
* `wrapLegacyClassifier` (see `@mailwoman/classifiers`); the neural classifier (Phase 3)
|
|
16
|
+
* implements this interface natively. The solver consumes one normalized shape.
|
|
17
|
+
*/
|
|
18
|
+
import type { Span } from "../tokenization/index.js";
|
|
19
|
+
import type { ComponentTag } from "./component.js";
|
|
20
|
+
/**
 * Call-site alias for a section of the tokenized input.
 *
 * A section is a sub-`Span` produced by splitting the input on boundary characters (commas, line
 * breaks, etc.). `TokenContext.sections` exposes sections as plain `Span` instances; the alias
 * only documents intent.
 */
export type Section = Span;
|
|
26
|
+
/**
 * Where a `ClassificationProposal` came from. Drives policy decisions and downstream telemetry.
 *
 * - `rule`: produced by a legacy rule classifier through the adapter.
 * - `neural`: produced by an ONNX-backed sequence classifier.
 * - `merged`: synthetic source for a merger that fused proposals from several classifiers (rare;
 *   mostly for telemetry on `merged` ids).
 */
export type ClassificationProposalSource =
    | "rule"
    | "neural"
    | "merged";
|
|
35
|
+
/**
 * One typed classification candidate, as produced by any classifier.
 *
 * Follows Mailwoman's pre-refactor per-component output shape and adds `source` and `source_id`,
 * so the origin of a proposal can be read from the proposal itself rather than from external
 * state.
 */
export interface ClassificationProposal {
    /** The span the proposal is about. */
    span: Span;

    /** The component type the classifier assigns to the span. */
    component: ComponentTag;

    /** How confident the classifier is, in [0, 1]. */
    confidence: number;

    /** Provenance: the classifier family that produced the proposal. */
    source: ClassificationProposalSource;

    /**
     * Identifies the specific classifier instance. Rule wrappers use the legacy classifier's
     * stable id (e.g. `house_number`, `postcode`, `whos_on_first`); neural classifiers use a
     * versioned model id such as `neural-v0.3.1-en-us`.
     */
    source_id: string;

    /**
     * Solver penalty for this proposal. The higher the penalty, the less likely the proposal is
     * to appear in the winning solution.
     */
    penalty: number;

    /**
     * Opaque metadata for debugging and telemetry; the solver never consults it. Common keys:
     * `languages`, `flags`, `legacyClassification`.
     */
    metadata?: Record<string, unknown>;
}
|
|
68
|
+
/**
 * Context passed to a classifier for a single request.
 */
export interface ClassifierContext {
    /** Locale of this classification request, when known. */
    locale?: string;

    /** Proposals already produced for this request (for composites). */
    prior?: ReadonlyArray<ClassificationProposal>;

    /** Cancellation signal. */
    signal?: AbortSignal;
}
|
|
79
|
+
/**
 * The plug-in contract implemented by every classifier.
 *
 * Constructing a classifier must be cheap. Per-classification work happens in {@link classify};
 * pre-flight work (loading dictionaries, warming up an ONNX session) belongs in the optional
 * `ready()` step.
 */
export interface ProposalClassifier {
    /** Stable identifier, used as `source_id` on the proposals this classifier emits. */
    readonly id: string;

    /**
     * The components this classifier may emit. Enforced: the adapter drops proposals for tags
     * outside this list and logs a warning.
     */
    readonly emits: ReadonlyArray<ComponentTag>;

    /**
     * The locales this classifier serves; `"*"` means locale-agnostic.
     *
     * The policy layer uses this to skip classifiers that are not relevant to the requested
     * locale.
     */
    readonly locales: ReadonlyArray<string | "*">;

    /** Optional async pre-flight. */
    ready?(): Promise<void>;

    /**
     * Classify a section. Implementations MUST NOT throw: on failure, return an empty array and
     * log via the project logger.
     */
    classify(section: Section, context: ClassifierContext): Promise<ClassificationProposal[]>;
}
|
|
107
|
+
/**
 * Convenience contract for a synchronous classifier (legacy rule wrappers usually fit here).
 *
 * The adapter wraps these into the async `ProposalClassifier` interface so the solver path stays
 * uniform.
 */
export interface SyncProposalClassifier {
    readonly id: string;
    readonly emits: ReadonlyArray<ComponentTag>;
    readonly locales: ReadonlyArray<string | "*">;
    classifySync(section: Section, context: ClassifierContext): ClassificationProposal[];
}
|
|
117
|
+
//# sourceMappingURL=classifier.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"classifier.d.ts","sourceRoot":"","sources":["../../types/classifier.ts"],"names":[],"mappings":"AAAA;;;;;;;;;;;;;;;;GAgBG;AAEH,OAAO,KAAK,EAAE,IAAI,EAAE,MAAM,0BAA0B,CAAA;AACpD,OAAO,KAAK,EAAE,YAAY,EAAE,MAAM,gBAAgB,CAAA;AAElD;;;;GAIG;AACH,MAAM,MAAM,OAAO,GAAG,IAAI,CAAA;AAE1B;;;;;;;GAOG;AACH,MAAM,MAAM,4BAA4B,GAAG,MAAM,GAAG,QAAQ,GAAG,QAAQ,CAAA;AAEvE;;;;;;GAMG;AACH,MAAM,WAAW,sBAAsB;IACtC,qCAAqC;IACrC,IAAI,EAAE,IAAI,CAAA;IAEV,yDAAyD;IACzD,SAAS,EAAE,YAAY,CAAA;IAEvB,uCAAuC;IACvC,UAAU,EAAE,MAAM,CAAA;IAElB,mEAAmE;IACnE,MAAM,EAAE,4BAA4B,CAAA;IAEpC;;;;OAIG;IACH,SAAS,EAAE,MAAM,CAAA;IAEjB;;;OAGG;IACH,OAAO,EAAE,MAAM,CAAA;IAEf;;;OAGG;IACH,QAAQ,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAA;CAClC;AAED;;GAEG;AACH,MAAM,WAAW,iBAAiB;IACjC,wDAAwD;IACxD,MAAM,CAAC,EAAE,MAAM,CAAA;IAEf,oEAAoE;IACpE,KAAK,CAAC,EAAE,SAAS,sBAAsB,EAAE,CAAA;IAEzC,2BAA2B;IAC3B,MAAM,CAAC,EAAE,WAAW,CAAA;CACpB;AAED;;;;;GAKG;AACH,MAAM,WAAW,kBAAkB;IAClC,mEAAmE;IACnE,QAAQ,CAAC,EAAE,EAAE,MAAM,CAAA;IAEnB;;;OAGG;IACH,QAAQ,CAAC,KAAK,EAAE,SAAS,YAAY,EAAE,CAAA;IAEvC;;;;OAIG;IACH,QAAQ,CAAC,OAAO,EAAE,SAAS,CAAC,MAAM,GAAG,GAAG,CAAC,EAAE,CAAA;IAE3C,iCAAiC;IACjC,KAAK,CAAC,IAAI,OAAO,CAAC,IAAI,CAAC,CAAA;IAEvB;;;OAGG;IACH,QAAQ,CAAC,OAAO,EAAE,OAAO,EAAE,OAAO,EAAE,iBAAiB,GAAG,OAAO,CAAC,sBAAsB,EAAE,CAAC,CAAA;CACzF;AAED;;;GAGG;AACH,MAAM,WAAW,sBAAsB;IACtC,QAAQ,CAAC,EAAE,EAAE,MAAM,CAAA;IACnB,QAAQ,CAAC,KAAK,EAAE,SAAS,YAAY,EAAE,CAAA;IACvC,QAAQ,CAAC,OAAO,EAAE,SAAS,CAAC,MAAM,GAAG,GAAG,CAAC,EAAE,CAAA;IAC3C,YAAY,CAAC,OAAO,EAAE,OAAO,EAAE,OAAO,EAAE,iBAAiB,GAAG,sBAAsB,EAAE,CAAA;CACpF"}
|
|
@@ -0,0 +1,19 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* @copyright Sister Software
|
|
3
|
+
* @license AGPL-3.0
|
|
4
|
+
* @author Teffen Ellis, et al.
|
|
5
|
+
*
|
|
6
|
+
* Classifier-side contracts for the neural integration (per #6).
|
|
7
|
+
*
|
|
8
|
+
* These interfaces are deliberately distinct from the existing `Classifier` shape in
|
|
9
|
+
* `../classification/BaseClassifier.ts`. The legacy shape is mutation-based —
|
|
10
|
+
* `classifyTokens(context): void` — and runs synchronously over the span graph. The shape
|
|
11
|
+
* declared here is pull-based and async: a classifier returns a list of `ClassificationProposal`
|
|
12
|
+
* objects keyed by the canonical `ComponentTag` union.
|
|
13
|
+
*
|
|
14
|
+
* Both shapes co-exist during the Ship-of-Theseus rollout. Rule classifiers are wrapped via
|
|
15
|
+
* `wrapLegacyClassifier` (see `@mailwoman/classifiers`); the neural classifier (Phase 3)
|
|
16
|
+
* implements this interface natively. The solver consumes one normalized shape.
|
|
17
|
+
*/
|
|
18
|
+
export {};
|
|
19
|
+
//# sourceMappingURL=classifier.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"classifier.js","sourceRoot":"","sources":["../../types/classifier.ts"],"names":[],"mappings":"AAAA;;;;;;;;;;;;;;;;GAgBG"}
|
|
@@ -0,0 +1,42 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* @copyright Sister Software
|
|
3
|
+
* @license AGPL-3.0
|
|
4
|
+
* @author Teffen Ellis, et al.
|
|
5
|
+
*
|
|
6
|
+
* Canonical address component schema for the neural classifier pipeline.
|
|
7
|
+
*
|
|
8
|
+
* This file is the single source of truth for `ComponentTag`. Any change here requires (per #5 of
|
|
9
|
+
* the Mailwoman Neural plan):
|
|
10
|
+
*
|
|
11
|
+
* 1. A written rationale in the commit message.
|
|
12
|
+
* 2. A migration plan for corpus rows tagged with the prior schema.
|
|
13
|
+
* 3. A same-commit check that alignment, training, and inference code is updated to match.
|
|
14
|
+
*
|
|
15
|
+
* The legacy `Classifications` set in `../classification/scheme.ts` is kept independent on purpose:
|
|
16
|
+
* rule classifiers continue to emit those, the neural classifier emits these. The bridge between
|
|
17
|
+
* the two lives in the adapter layer (see #6).
|
|
18
|
+
*/
|
|
19
|
+
/**
 * Canonical list of address component tags, ordered by phase and locale.
 *
 * - Universal (Phase 1): country, region, locality, dependent_locality, postcode, subregion
 * - Street-level (Phase 2): house_number, street, street_prefix, street_prefix_particle,
 *   street_suffix, intersection_a, intersection_b, unit
 * - Venue-level (Phase 3): venue, attention, po_box
 * - FR-specific: cedex
 * - JP-specific (Phase 6, declared but unused before then): prefecture, municipality, district,
 *   block, sub_block, building_number, building_name
 */
export declare const COMPONENT_TAGS: readonly [
    "country", "region", "locality", "dependent_locality", "postcode", "subregion",
    "house_number", "street", "street_prefix", "street_prefix_particle", "street_suffix", "intersection_a", "intersection_b", "unit",
    "venue", "attention", "po_box",
    "cedex",
    "prefecture", "municipality", "district", "block", "sub_block", "building_number", "building_name"
];
|
|
31
|
+
/**
 * Any one of the address component tags listed in `COMPONENT_TAGS`.
 */
export type ComponentTag = (typeof COMPONENT_TAGS)[number];
|
|
33
|
+
/**
 * BIO-encoded label set: the single label `O`, followed by a `B-` / `I-` pair for every
 * component tag.
 *
 * This is the per-token output alphabet of the sequence-labeling neural model. Inference decodes
 * a stream of these labels back into character-aligned `ClassificationProposal`s.
 */
export declare const BIO_LABELS: readonly ["O", ...(`B-${ComponentTag}` | `I-${ComponentTag}`)[]];
|
|
40
|
+
/**
 * Any one of the labels listed in `BIO_LABELS`.
 */
export type BioLabel = (typeof BIO_LABELS)[number];
|
|
42
|
+
//# sourceMappingURL=component.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"component.d.ts","sourceRoot":"","sources":["../../types/component.ts"],"names":[],"mappings":"AAAA;;;;;;;;;;;;;;;;;GAiBG;AAEH;;;;;;;;;;GAUG;AACH,eAAO,MAAM,cAAc,0WA+BjB,CAAA;AAEV,uDAAuD;AACvD,MAAM,MAAM,YAAY,GAAG,CAAC,OAAO,cAAc,CAAC,CAAC,MAAM,CAAC,CAAA;AAE1D;;;;;GAKG;AACH,eAAO,MAAM,UAAU,02BAAwF,CAAA;AAE/G,gCAAgC;AAChC,MAAM,MAAM,QAAQ,GAAG,CAAC,OAAO,UAAU,CAAC,CAAC,MAAM,CAAC,CAAA"}
|
|
@@ -0,0 +1,69 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* @copyright Sister Software
|
|
3
|
+
* @license AGPL-3.0
|
|
4
|
+
* @author Teffen Ellis, et al.
|
|
5
|
+
*
|
|
6
|
+
* Canonical address component schema for the neural classifier pipeline.
|
|
7
|
+
*
|
|
8
|
+
* This file is the single source of truth for `ComponentTag`. Any change here requires (per #5 of
|
|
9
|
+
* the Mailwoman Neural plan):
|
|
10
|
+
*
|
|
11
|
+
* 1. A written rationale in the commit message.
|
|
12
|
+
* 2. A migration plan for corpus rows tagged with the prior schema.
|
|
13
|
+
* 3. A same-commit check that alignment, training, and inference code is updated to match.
|
|
14
|
+
*
|
|
15
|
+
* The legacy `Classifications` set in `../classification/scheme.ts` is kept independent on purpose:
|
|
16
|
+
* rule classifiers continue to emit those, the neural classifier emits these. The bridge between
|
|
17
|
+
* the two lives in the adapter layer (see #6).
|
|
18
|
+
*/
|
|
19
|
+
/**
 * The canonical address component tag list, ordered by phase and locale.
 *
 * - Universal (Phase 1): country, region, locality, dependent_locality, postcode, subregion
 * - Street-level (Phase 2): house_number, street, street_prefix*, street_suffix, intersection_a/b,
 *   unit
 * - Venue-level (Phase 3): venue, attention, po_box
 * - FR-specific: cedex
 * - JP-specific (Phase 6, declared but unused before then): prefecture, municipality, district,
 *   block, sub_block, building_number, building_name
 *
 * The array is frozen: it is typed as a readonly tuple and other values are derived from it once
 * at module load, so a later in-place mutation would silently put them out of sync.
 */
export const COMPONENT_TAGS = Object.freeze([
    // Universal
    "country",
    "region",
    "locality",
    "dependent_locality",
    "postcode",
    "subregion",
    // Street-level
    "house_number",
    "street",
    "street_prefix",
    "street_prefix_particle",
    "street_suffix",
    "intersection_a",
    "intersection_b",
    "unit",
    // Venue-level
    "venue",
    "attention",
    "po_box",
    // FR-specific
    "cedex",
    // JP-specific (Phase 6 — declared but unused until then)
    "prefecture",
    "municipality",
    "district",
    "block",
    "sub_block",
    "building_number",
    "building_name",
]);
|
|
62
|
+
/**
 * BIO-encoded label set: the single label `O`, followed by a `B-` / `I-` pair for every entry of
 * `COMPONENT_TAGS`, in the same order.
 *
 * This is the per-token output alphabet of the sequence-labeling neural model. Inference decodes
 * a stream of these labels back into character-aligned `ClassificationProposal`s.
 */
export const BIO_LABELS = ["O"];
for (const tag of COMPONENT_TAGS) {
    BIO_LABELS.push(`B-${tag}`, `I-${tag}`);
}
|
|
69
|
+
//# sourceMappingURL=component.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"component.js","sourceRoot":"","sources":["../../types/component.ts"],"names":[],"mappings":"AAAA;;;;;;;;;;;;;;;;;GAiBG;AAEH;;;;;;;;;;GAUG;AACH,MAAM,CAAC,MAAM,cAAc,GAAG;IAC7B,YAAY;IACZ,SAAS;IACT,QAAQ;IACR,UAAU;IACV,oBAAoB;IACpB,UAAU;IACV,WAAW;IACX,eAAe;IACf,cAAc;IACd,QAAQ;IACR,eAAe;IACf,wBAAwB;IACxB,eAAe;IACf,gBAAgB;IAChB,gBAAgB;IAChB,MAAM;IACN,cAAc;IACd,OAAO;IACP,WAAW;IACX,QAAQ;IACR,cAAc;IACd,OAAO;IACP,yDAAyD;IACzD,YAAY;IACZ,cAAc;IACd,UAAU;IACV,OAAO;IACP,WAAW;IACX,iBAAiB;IACjB,eAAe;CACN,CAAA;AAKV;;;;;GAKG;AACH,MAAM,CAAC,MAAM,UAAU,GAAG,CAAC,GAAG,EAAE,GAAG,cAAc,CAAC,OAAO,CAAC,CAAC,GAAG,EAAE,EAAE,CAAC,CAAC,KAAK,GAAG,EAAE,EAAE,KAAK,GAAG,EAAE,CAAU,CAAC,CAAU,CAAA"}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../types/index.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAEH,cAAc,iBAAiB,CAAA;AAC/B,cAAc,gBAAgB,CAAA;AAC9B,cAAc,cAAc,CAAA"}
|