@mailwoman/core 2.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/data/chromium-i18n/ssl-address/AC.json +8 -0
- package/data/chromium-i18n/ssl-address/AD.json +16 -0
- package/data/chromium-i18n/ssl-address/AE.json +15 -0
- package/data/chromium-i18n/ssl-address/AF.json +8 -0
- package/data/chromium-i18n/ssl-address/AG.json +1 -0
- package/data/chromium-i18n/ssl-address/AI.json +8 -0
- package/data/chromium-i18n/ssl-address/AL.json +8 -0
- package/data/chromium-i18n/ssl-address/AM.json +16 -0
- package/data/chromium-i18n/ssl-address/AO.json +1 -0
- package/data/chromium-i18n/ssl-address/AQ.json +1 -0
- package/data/chromium-i18n/ssl-address/AR.json +16 -0
- package/data/chromium-i18n/ssl-address/AS.json +13 -0
- package/data/chromium-i18n/ssl-address/AT.json +10 -0
- package/data/chromium-i18n/ssl-address/AU.json +20 -0
- package/data/chromium-i18n/ssl-address/AW.json +1 -0
- package/data/chromium-i18n/ssl-address/AX.json +11 -0
- package/data/chromium-i18n/ssl-address/AZ.json +9 -0
- package/data/chromium-i18n/ssl-address/BA.json +8 -0
- package/data/chromium-i18n/ssl-address/BB.json +9 -0
- package/data/chromium-i18n/ssl-address/BD.json +9 -0
- package/data/chromium-i18n/ssl-address/BE.json +10 -0
- package/data/chromium-i18n/ssl-address/BF.json +6 -0
- package/data/chromium-i18n/ssl-address/BG.json +9 -0
- package/data/chromium-i18n/ssl-address/BH.json +8 -0
- package/data/chromium-i18n/ssl-address/BI.json +1 -0
- package/data/chromium-i18n/ssl-address/BJ.json +1 -0
- package/data/chromium-i18n/ssl-address/BL.json +11 -0
- package/data/chromium-i18n/ssl-address/BM.json +9 -0
- package/data/chromium-i18n/ssl-address/BN.json +9 -0
- package/data/chromium-i18n/ssl-address/BO.json +1 -0
- package/data/chromium-i18n/ssl-address/BQ.json +1 -0
- package/data/chromium-i18n/ssl-address/BR.json +21 -0
- package/data/chromium-i18n/ssl-address/BS.json +12 -0
- package/data/chromium-i18n/ssl-address/BT.json +9 -0
- package/data/chromium-i18n/ssl-address/BV.json +1 -0
- package/data/chromium-i18n/ssl-address/BW.json +1 -0
- package/data/chromium-i18n/ssl-address/BY.json +9 -0
- package/data/chromium-i18n/ssl-address/BZ.json +1 -0
- package/data/chromium-i18n/ssl-address/CA.json +17 -0
- package/data/chromium-i18n/ssl-address/CC.json +9 -0
- package/data/chromium-i18n/ssl-address/CD.json +1 -0
- package/data/chromium-i18n/ssl-address/CF.json +1 -0
- package/data/chromium-i18n/ssl-address/CG.json +1 -0
- package/data/chromium-i18n/ssl-address/CH.json +12 -0
- package/data/chromium-i18n/ssl-address/CI.json +6 -0
- package/data/chromium-i18n/ssl-address/CK.json +1 -0
- package/data/chromium-i18n/ssl-address/CL.json +15 -0
- package/data/chromium-i18n/ssl-address/CM.json +1 -0
- package/data/chromium-i18n/ssl-address/CN.json +22 -0
- package/data/chromium-i18n/ssl-address/CO.json +11 -0
- package/data/chromium-i18n/ssl-address/CR.json +10 -0
- package/data/chromium-i18n/ssl-address/CU.json +12 -0
- package/data/chromium-i18n/ssl-address/CV.json +13 -0
- package/data/chromium-i18n/ssl-address/CW.json +1 -0
- package/data/chromium-i18n/ssl-address/CX.json +9 -0
- package/data/chromium-i18n/ssl-address/CY.json +8 -0
- package/data/chromium-i18n/ssl-address/CZ.json +10 -0
- package/data/chromium-i18n/ssl-address/DE.json +10 -0
- package/data/chromium-i18n/ssl-address/DJ.json +1 -0
- package/data/chromium-i18n/ssl-address/DK.json +10 -0
- package/data/chromium-i18n/ssl-address/DM.json +1 -0
- package/data/chromium-i18n/ssl-address/DO.json +9 -0
- package/data/chromium-i18n/ssl-address/DZ.json +8 -0
- package/data/chromium-i18n/ssl-address/EC.json +10 -0
- package/data/chromium-i18n/ssl-address/EE.json +9 -0
- package/data/chromium-i18n/ssl-address/EG.json +16 -0
- package/data/chromium-i18n/ssl-address/EH.json +8 -0
- package/data/chromium-i18n/ssl-address/ER.json +1 -0
- package/data/chromium-i18n/ssl-address/ES.json +16 -0
- package/data/chromium-i18n/ssl-address/ET.json +8 -0
- package/data/chromium-i18n/ssl-address/FI.json +11 -0
- package/data/chromium-i18n/ssl-address/FJ.json +1 -0
- package/data/chromium-i18n/ssl-address/FK.json +10 -0
- package/data/chromium-i18n/ssl-address/FM.json +13 -0
- package/data/chromium-i18n/ssl-address/FO.json +10 -0
- package/data/chromium-i18n/ssl-address/FR.json +11 -0
- package/data/chromium-i18n/ssl-address/GA.json +1 -0
- package/data/chromium-i18n/ssl-address/GB.json +12 -0
- package/data/chromium-i18n/ssl-address/GD.json +1 -0
- package/data/chromium-i18n/ssl-address/GE.json +9 -0
- package/data/chromium-i18n/ssl-address/GF.json +11 -0
- package/data/chromium-i18n/ssl-address/GG.json +11 -0
- package/data/chromium-i18n/ssl-address/GH.json +1 -0
- package/data/chromium-i18n/ssl-address/GI.json +9 -0
- package/data/chromium-i18n/ssl-address/GL.json +9 -0
- package/data/chromium-i18n/ssl-address/GM.json +1 -0
- package/data/chromium-i18n/ssl-address/GN.json +8 -0
- package/data/chromium-i18n/ssl-address/GP.json +11 -0
- package/data/chromium-i18n/ssl-address/GQ.json +1 -0
- package/data/chromium-i18n/ssl-address/GR.json +10 -0
- package/data/chromium-i18n/ssl-address/GS.json +10 -0
- package/data/chromium-i18n/ssl-address/GT.json +8 -0
- package/data/chromium-i18n/ssl-address/GU.json +12 -0
- package/data/chromium-i18n/ssl-address/GW.json +8 -0
- package/data/chromium-i18n/ssl-address/GY.json +1 -0
- package/data/chromium-i18n/ssl-address/HK.json +16 -0
- package/data/chromium-i18n/ssl-address/HM.json +9 -0
- package/data/chromium-i18n/ssl-address/HN.json +9 -0
- package/data/chromium-i18n/ssl-address/HR.json +10 -0
- package/data/chromium-i18n/ssl-address/HT.json +9 -0
- package/data/chromium-i18n/ssl-address/HU.json +11 -0
- package/data/chromium-i18n/ssl-address/ID.json +13 -0
- package/data/chromium-i18n/ssl-address/IE.json +16 -0
- package/data/chromium-i18n/ssl-address/IL.json +9 -0
- package/data/chromium-i18n/ssl-address/IM.json +11 -0
- package/data/chromium-i18n/ssl-address/IN.json +18 -0
- package/data/chromium-i18n/ssl-address/IO.json +10 -0
- package/data/chromium-i18n/ssl-address/IQ.json +10 -0
- package/data/chromium-i18n/ssl-address/IR.json +14 -0
- package/data/chromium-i18n/ssl-address/IS.json +9 -0
- package/data/chromium-i18n/ssl-address/IT.json +17 -0
- package/data/chromium-i18n/ssl-address/JE.json +11 -0
- package/data/chromium-i18n/ssl-address/JM.json +12 -0
- package/data/chromium-i18n/ssl-address/JO.json +8 -0
- package/data/chromium-i18n/ssl-address/JP.json +19 -0
- package/data/chromium-i18n/ssl-address/KE.json +8 -0
- package/data/chromium-i18n/ssl-address/KG.json +8 -0
- package/data/chromium-i18n/ssl-address/KH.json +8 -0
- package/data/chromium-i18n/ssl-address/KI.json +8 -0
- package/data/chromium-i18n/ssl-address/KM.json +1 -0
- package/data/chromium-i18n/ssl-address/KN.json +12 -0
- package/data/chromium-i18n/ssl-address/KP.json +12 -0
- package/data/chromium-i18n/ssl-address/KR.json +23 -0
- package/data/chromium-i18n/ssl-address/KW.json +8 -0
- package/data/chromium-i18n/ssl-address/KY.json +14 -0
- package/data/chromium-i18n/ssl-address/KZ.json +8 -0
- package/data/chromium-i18n/ssl-address/LA.json +8 -0
- package/data/chromium-i18n/ssl-address/LB.json +8 -0
- package/data/chromium-i18n/ssl-address/LC.json +1 -0
- package/data/chromium-i18n/ssl-address/LI.json +11 -0
- package/data/chromium-i18n/ssl-address/LK.json +9 -0
- package/data/chromium-i18n/ssl-address/LR.json +8 -0
- package/data/chromium-i18n/ssl-address/LS.json +8 -0
- package/data/chromium-i18n/ssl-address/LT.json +10 -0
- package/data/chromium-i18n/ssl-address/LU.json +11 -0
- package/data/chromium-i18n/ssl-address/LV.json +9 -0
- package/data/chromium-i18n/ssl-address/LY.json +1 -0
- package/data/chromium-i18n/ssl-address/MA.json +8 -0
- package/data/chromium-i18n/ssl-address/MC.json +9 -0
- package/data/chromium-i18n/ssl-address/MD.json +9 -0
- package/data/chromium-i18n/ssl-address/ME.json +8 -0
- package/data/chromium-i18n/ssl-address/MF.json +11 -0
- package/data/chromium-i18n/ssl-address/MG.json +8 -0
- package/data/chromium-i18n/ssl-address/MH.json +13 -0
- package/data/chromium-i18n/ssl-address/MK.json +8 -0
- package/data/chromium-i18n/ssl-address/ML.json +1 -0
- package/data/chromium-i18n/ssl-address/MM.json +8 -0
- package/data/chromium-i18n/ssl-address/MN.json +9 -0
- package/data/chromium-i18n/ssl-address/MO.json +8 -0
- package/data/chromium-i18n/ssl-address/MP.json +13 -0
- package/data/chromium-i18n/ssl-address/MQ.json +11 -0
- package/data/chromium-i18n/ssl-address/MR.json +1 -0
- package/data/chromium-i18n/ssl-address/MS.json +1 -0
- package/data/chromium-i18n/ssl-address/MT.json +10 -0
- package/data/chromium-i18n/ssl-address/MU.json +9 -0
- package/data/chromium-i18n/ssl-address/MV.json +9 -0
- package/data/chromium-i18n/ssl-address/MW.json +1 -0
- package/data/chromium-i18n/ssl-address/MX.json +20 -0
- package/data/chromium-i18n/ssl-address/MY.json +19 -0
- package/data/chromium-i18n/ssl-address/MZ.json +12 -0
- package/data/chromium-i18n/ssl-address/NA.json +1 -0
- package/data/chromium-i18n/ssl-address/NC.json +11 -0
- package/data/chromium-i18n/ssl-address/NE.json +8 -0
- package/data/chromium-i18n/ssl-address/NF.json +9 -0
- package/data/chromium-i18n/ssl-address/NG.json +15 -0
- package/data/chromium-i18n/ssl-address/NI.json +16 -0
- package/data/chromium-i18n/ssl-address/NL.json +10 -0
- package/data/chromium-i18n/ssl-address/NO.json +11 -0
- package/data/chromium-i18n/ssl-address/NP.json +9 -0
- package/data/chromium-i18n/ssl-address/NR.json +12 -0
- package/data/chromium-i18n/ssl-address/NU.json +1 -0
- package/data/chromium-i18n/ssl-address/NZ.json +10 -0
- package/data/chromium-i18n/ssl-address/OM.json +8 -0
- package/data/chromium-i18n/ssl-address/PA.json +7 -0
- package/data/chromium-i18n/ssl-address/PE.json +14 -0
- package/data/chromium-i18n/ssl-address/PF.json +11 -0
- package/data/chromium-i18n/ssl-address/PG.json +9 -0
- package/data/chromium-i18n/ssl-address/PH.json +15 -0
- package/data/chromium-i18n/ssl-address/PK.json +9 -0
- package/data/chromium-i18n/ssl-address/PL.json +10 -0
- package/data/chromium-i18n/ssl-address/PM.json +10 -0
- package/data/chromium-i18n/ssl-address/PN.json +10 -0
- package/data/chromium-i18n/ssl-address/PR.json +13 -0
- package/data/chromium-i18n/ssl-address/PS.json +1 -0
- package/data/chromium-i18n/ssl-address/PT.json +10 -0
- package/data/chromium-i18n/ssl-address/PW.json +13 -0
- package/data/chromium-i18n/ssl-address/PY.json +8 -0
- package/data/chromium-i18n/ssl-address/QA.json +1 -0
- package/data/chromium-i18n/ssl-address/RE.json +11 -0
- package/data/chromium-i18n/ssl-address/RO.json +10 -0
- package/data/chromium-i18n/ssl-address/RS.json +9 -0
- package/data/chromium-i18n/ssl-address/RU.json +20 -0
- package/data/chromium-i18n/ssl-address/RW.json +1 -0
- package/data/chromium-i18n/ssl-address/SA.json +8 -0
- package/data/chromium-i18n/ssl-address/SB.json +1 -0
- package/data/chromium-i18n/ssl-address/SC.json +8 -0
- package/data/chromium-i18n/ssl-address/SD.json +9 -0
- package/data/chromium-i18n/ssl-address/SE.json +12 -0
- package/data/chromium-i18n/ssl-address/SG.json +10 -0
- package/data/chromium-i18n/ssl-address/SH.json +10 -0
- package/data/chromium-i18n/ssl-address/SI.json +9 -0
- package/data/chromium-i18n/ssl-address/SJ.json +11 -0
- package/data/chromium-i18n/ssl-address/SK.json +10 -0
- package/data/chromium-i18n/ssl-address/SL.json +1 -0
- package/data/chromium-i18n/ssl-address/SM.json +10 -0
- package/data/chromium-i18n/ssl-address/SN.json +8 -0
- package/data/chromium-i18n/ssl-address/SO.json +15 -0
- package/data/chromium-i18n/ssl-address/SR.json +11 -0
- package/data/chromium-i18n/ssl-address/SS.json +1 -0
- package/data/chromium-i18n/ssl-address/ST.json +1 -0
- package/data/chromium-i18n/ssl-address/SV.json +17 -0
- package/data/chromium-i18n/ssl-address/SX.json +1 -0
- package/data/chromium-i18n/ssl-address/SY.json +6 -0
- package/data/chromium-i18n/ssl-address/SZ.json +10 -0
- package/data/chromium-i18n/ssl-address/TA.json +8 -0
- package/data/chromium-i18n/ssl-address/TC.json +10 -0
- package/data/chromium-i18n/ssl-address/TD.json +1 -0
- package/data/chromium-i18n/ssl-address/TF.json +1 -0
- package/data/chromium-i18n/ssl-address/TG.json +1 -0
- package/data/chromium-i18n/ssl-address/TH.json +16 -0
- package/data/chromium-i18n/ssl-address/TJ.json +8 -0
- package/data/chromium-i18n/ssl-address/TK.json +1 -0
- package/data/chromium-i18n/ssl-address/TL.json +1 -0
- package/data/chromium-i18n/ssl-address/TM.json +8 -0
- package/data/chromium-i18n/ssl-address/TN.json +9 -0
- package/data/chromium-i18n/ssl-address/TO.json +1 -0
- package/data/chromium-i18n/ssl-address/TR.json +16 -0
- package/data/chromium-i18n/ssl-address/TT.json +1 -0
- package/data/chromium-i18n/ssl-address/TV.json +12 -0
- package/data/chromium-i18n/ssl-address/TW.json +20 -0
- package/data/chromium-i18n/ssl-address/TZ.json +8 -0
- package/data/chromium-i18n/ssl-address/UA.json +19 -0
- package/data/chromium-i18n/ssl-address/UG.json +1 -0
- package/data/chromium-i18n/ssl-address/UM.json +13 -0
- package/data/chromium-i18n/ssl-address/US.json +20 -0
- package/data/chromium-i18n/ssl-address/UY.json +15 -0
- package/data/chromium-i18n/ssl-address/UZ.json +10 -0
- package/data/chromium-i18n/ssl-address/VA.json +8 -0
- package/data/chromium-i18n/ssl-address/VC.json +9 -0
- package/data/chromium-i18n/ssl-address/VE.json +16 -0
- package/data/chromium-i18n/ssl-address/VG.json +9 -0
- package/data/chromium-i18n/ssl-address/VI.json +13 -0
- package/data/chromium-i18n/ssl-address/VN.json +15 -0
- package/data/chromium-i18n/ssl-address/VU.json +1 -0
- package/data/chromium-i18n/ssl-address/WF.json +10 -0
- package/data/chromium-i18n/ssl-address/WS.json +1 -0
- package/data/chromium-i18n/ssl-address/XK.json +8 -0
- package/data/chromium-i18n/ssl-address/YE.json +1 -0
- package/data/chromium-i18n/ssl-address/YT.json +10 -0
- package/data/chromium-i18n/ssl-address/ZA.json +10 -0
- package/data/chromium-i18n/ssl-address/ZM.json +8 -0
- package/data/chromium-i18n/ssl-address/ZW.json +1 -0
- package/data/chromium-i18n/ssl-address-download.sh +15 -0
- package/data/internal/dictionaries/languages.csv +184 -0
- package/data/internal/dictionaries/libpostal/af/personal_titles.txt +2 -0
- package/data/internal/dictionaries/libpostal/all/surnames.txt +1 -0
- package/data/internal/dictionaries/libpostal/de/academic_degrees.txt +7 -0
- package/data/internal/dictionaries/libpostal/de/concatenated_suffixes_separable.txt +3 -0
- package/data/internal/dictionaries/libpostal/de/near.txt +2 -0
- package/data/internal/dictionaries/libpostal/de/place_names.txt +11 -0
- package/data/internal/dictionaries/libpostal/de/stopwords.txt +1 -0
- package/data/internal/dictionaries/libpostal/de/street_types.txt +2 -0
- package/data/internal/dictionaries/libpostal/en/place_names.txt +7 -0
- package/data/internal/dictionaries/libpostal/en/road_types.txt +18 -0
- package/data/internal/dictionaries/libpostal/en/street_names.txt +2 -0
- package/data/internal/dictionaries/libpostal/en/street_types.txt +16 -0
- package/data/internal/dictionaries/libpostal/en/unit_types_numbered.txt +3 -0
- package/data/internal/dictionaries/libpostal/es/street_types.txt +2 -0
- package/data/internal/dictionaries/libpostal/fr/personal_titles.txt +4 -0
- package/data/internal/dictionaries/libpostal/fr/stopwords.txt +2 -0
- package/data/internal/dictionaries/libpostal/fr/street_types.txt +5 -0
- package/data/internal/dictionaries/libpostal/it/street_types.txt +2 -0
- package/data/internal/dictionaries/libpostal/ko/street_types.txt +1 -0
- package/data/internal/dictionaries/libpostal/nb/concatenated_suffixes_inseparable.txt +40 -0
- package/data/internal/dictionaries/libpostal/nb/directionals.txt +8 -0
- package/data/internal/dictionaries/libpostal/nb/street_types.txt +36 -0
- package/data/internal/dictionaries/libpostal/nl/concatenated_suffixes_inseparable.txt +1 -0
- package/data/internal/dictionaries/libpostal/nl/concatenated_suffixes_separable.txt +8 -0
- package/data/internal/dictionaries/libpostal/nl/directionals.txt +4 -0
- package/data/internal/dictionaries/libpostal/nl/personal_suffixes.txt +4 -0
- package/data/internal/dictionaries/libpostal/nl/personal_titles.txt +43 -0
- package/data/internal/dictionaries/libpostal/pl/place_names.txt +1 -0
- package/data/internal/dictionaries/libpostal/pl/synonyms.txt +1 -0
- package/data/internal/dictionaries/libpostal/sv/concatenated_suffixes_separable.txt +1 -0
- package/data/internal/dictionaries/whosonfirst/locality/name:eng_x_preferred.txt +81 -0
- package/data/internal/dictionaries/whosonfirst/locality/name:fra_x_preferred.txt +2 -0
- package/data/internal/dictionaries/whosonfirst/region/name:eng_x_preferred.txt +2 -0
- package/data/libpostal/dictionaries/README.md +88 -0
- package/data/libpostal/dictionaries/af/ambiguous_expansions.txt +8 -0
- package/data/libpostal/dictionaries/af/concatenated_suffixes_inseparable.txt +1 -0
- package/data/libpostal/dictionaries/af/concatenated_suffixes_separable.txt +14 -0
- package/data/libpostal/dictionaries/af/directionals.txt +12 -0
- package/data/libpostal/dictionaries/af/personal_titles.txt +23 -0
- package/data/libpostal/dictionaries/af/place_names.txt +2 -0
- package/data/libpostal/dictionaries/af/qualifiers.txt +4 -0
- package/data/libpostal/dictionaries/af/stopwords.txt +38 -0
- package/data/libpostal/dictionaries/af/street_types.txt +21 -0
- package/data/libpostal/dictionaries/all/ambiguous_expansions.txt +1 -0
- package/data/libpostal/dictionaries/all/chains.txt +504 -0
- package/data/libpostal/dictionaries/all/given_names.txt +12715 -0
- package/data/libpostal/dictionaries/all/people.txt +5 -0
- package/data/libpostal/dictionaries/all/surnames.txt +49375 -0
- package/data/libpostal/dictionaries/ar/personal_titles.txt +4 -0
- package/data/libpostal/dictionaries/ar/place_names.txt +1 -0
- package/data/libpostal/dictionaries/ar/street_types.txt +11 -0
- package/data/libpostal/dictionaries/ast/ambiguous_expansions.txt +1 -0
- package/data/libpostal/dictionaries/ast/personal_titles.txt +1 -0
- package/data/libpostal/dictionaries/ast/street_types.txt +3 -0
- package/data/libpostal/dictionaries/az/building_types.txt +1 -0
- package/data/libpostal/dictionaries/az/directionals.txt +8 -0
- package/data/libpostal/dictionaries/az/personal_titles.txt +3 -0
- package/data/libpostal/dictionaries/az/place_names.txt +1 -0
- package/data/libpostal/dictionaries/az/street_types.txt +18 -0
- package/data/libpostal/dictionaries/be/ambiguous_expansions.txt +8 -0
- package/data/libpostal/dictionaries/be/building_types.txt +2 -0
- package/data/libpostal/dictionaries/be/chains.txt +8 -0
- package/data/libpostal/dictionaries/be/directionals.txt +25 -0
- package/data/libpostal/dictionaries/be/house_numbers.txt +2 -0
- package/data/libpostal/dictionaries/be/personal_titles.txt +6 -0
- package/data/libpostal/dictionaries/be/qualifiers.txt +20 -0
- package/data/libpostal/dictionaries/be/street_types.txt +28 -0
- package/data/libpostal/dictionaries/be/unit_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/bg/ambiguous_expansions.txt +2 -0
- package/data/libpostal/dictionaries/bg/cross_streets.txt +10 -0
- package/data/libpostal/dictionaries/bg/directionals.txt +8 -0
- package/data/libpostal/dictionaries/bg/entrances.txt +2 -0
- package/data/libpostal/dictionaries/bg/level_types_numbered.txt +6 -0
- package/data/libpostal/dictionaries/bg/level_types_standalone.txt +4 -0
- package/data/libpostal/dictionaries/bg/near.txt +20 -0
- package/data/libpostal/dictionaries/bg/number.txt +2 -0
- package/data/libpostal/dictionaries/bg/personal_titles.txt +14 -0
- package/data/libpostal/dictionaries/bg/place_names.txt +6 -0
- package/data/libpostal/dictionaries/bg/post_office.txt +2 -0
- package/data/libpostal/dictionaries/bg/qualifiers.txt +10 -0
- package/data/libpostal/dictionaries/bg/staircases.txt +2 -0
- package/data/libpostal/dictionaries/bg/street_types.txt +6 -0
- package/data/libpostal/dictionaries/bg/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/bg/unit_types_numbered.txt +6 -0
- package/data/libpostal/dictionaries/br/personal_titles.txt +3 -0
- package/data/libpostal/dictionaries/br/place_names.txt +3 -0
- package/data/libpostal/dictionaries/br/qualifiers.txt +1 -0
- package/data/libpostal/dictionaries/br/stopwords.txt +4 -0
- package/data/libpostal/dictionaries/br/street_types.txt +40 -0
- package/data/libpostal/dictionaries/bs/ambiguous_expansions.txt +5 -0
- package/data/libpostal/dictionaries/bs/building_types.txt +1 -0
- package/data/libpostal/dictionaries/bs/cross_streets.txt +6 -0
- package/data/libpostal/dictionaries/bs/directionals.txt +4 -0
- package/data/libpostal/dictionaries/bs/entrances.txt +1 -0
- package/data/libpostal/dictionaries/bs/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/bs/level_types_mezzanine.txt +1 -0
- package/data/libpostal/dictionaries/bs/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/bs/level_types_standalone.txt +2 -0
- package/data/libpostal/dictionaries/bs/near.txt +5 -0
- package/data/libpostal/dictionaries/bs/no_number.txt +1 -0
- package/data/libpostal/dictionaries/bs/number.txt +1 -0
- package/data/libpostal/dictionaries/bs/personal_titles.txt +8 -0
- package/data/libpostal/dictionaries/bs/place_names.txt +9 -0
- package/data/libpostal/dictionaries/bs/post_office.txt +1 -0
- package/data/libpostal/dictionaries/bs/qualifiers.txt +2 -0
- package/data/libpostal/dictionaries/bs/staircases.txt +1 -0
- package/data/libpostal/dictionaries/bs/stopwords.txt +2 -0
- package/data/libpostal/dictionaries/bs/street_types.txt +12 -0
- package/data/libpostal/dictionaries/bs/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/bs/unit_types_numbered.txt +4 -0
- package/data/libpostal/dictionaries/ca/ambiguous_expansions.txt +9 -0
- package/data/libpostal/dictionaries/ca/cross_streets.txt +8 -0
- package/data/libpostal/dictionaries/ca/directionals.txt +9 -0
- package/data/libpostal/dictionaries/ca/elisions.txt +1 -0
- package/data/libpostal/dictionaries/ca/entrances.txt +1 -0
- package/data/libpostal/dictionaries/ca/given_names.txt +1 -0
- package/data/libpostal/dictionaries/ca/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/ca/level_types_mezzanine.txt +1 -0
- package/data/libpostal/dictionaries/ca/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/ca/level_types_standalone.txt +5 -0
- package/data/libpostal/dictionaries/ca/level_types_sub_basement.txt +1 -0
- package/data/libpostal/dictionaries/ca/near.txt +12 -0
- package/data/libpostal/dictionaries/ca/no_number.txt +1 -0
- package/data/libpostal/dictionaries/ca/number.txt +1 -0
- package/data/libpostal/dictionaries/ca/personal_titles.txt +10 -0
- package/data/libpostal/dictionaries/ca/place_names.txt +133 -0
- package/data/libpostal/dictionaries/ca/post_office.txt +1 -0
- package/data/libpostal/dictionaries/ca/postcodes.txt +1 -0
- package/data/libpostal/dictionaries/ca/qualifiers.txt +8 -0
- package/data/libpostal/dictionaries/ca/staircases.txt +1 -0
- package/data/libpostal/dictionaries/ca/stopwords.txt +31 -0
- package/data/libpostal/dictionaries/ca/street_types.txt +28 -0
- package/data/libpostal/dictionaries/ca/synonyms.txt +14 -0
- package/data/libpostal/dictionaries/ca/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/ca/unit_types_numbered.txt +10 -0
- package/data/libpostal/dictionaries/cs/ambiguous_expansions.txt +6 -0
- package/data/libpostal/dictionaries/cs/chains.txt +1 -0
- package/data/libpostal/dictionaries/cs/cross_streets.txt +9 -0
- package/data/libpostal/dictionaries/cs/directionals.txt +4 -0
- package/data/libpostal/dictionaries/cs/entrances.txt +1 -0
- package/data/libpostal/dictionaries/cs/house_numbers.txt +1 -0
- package/data/libpostal/dictionaries/cs/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/cs/level_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/cs/level_types_standalone.txt +1 -0
- package/data/libpostal/dictionaries/cs/near.txt +12 -0
- package/data/libpostal/dictionaries/cs/number.txt +1 -0
- package/data/libpostal/dictionaries/cs/personal_titles.txt +2 -0
- package/data/libpostal/dictionaries/cs/place_names.txt +47 -0
- package/data/libpostal/dictionaries/cs/post_office.txt +1 -0
- package/data/libpostal/dictionaries/cs/staircases.txt +1 -0
- package/data/libpostal/dictionaries/cs/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/cs/street_types.txt +6 -0
- package/data/libpostal/dictionaries/cs/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/cs/unit_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/cy/building_types.txt +5 -0
- package/data/libpostal/dictionaries/cy/directionals.txt +4 -0
- package/data/libpostal/dictionaries/cy/personal_titles.txt +2 -0
- package/data/libpostal/dictionaries/cy/place_names.txt +22 -0
- package/data/libpostal/dictionaries/cy/qualifiers.txt +2 -0
- package/data/libpostal/dictionaries/cy/stopwords.txt +3 -0
- package/data/libpostal/dictionaries/cy/street_types.txt +22 -0
- package/data/libpostal/dictionaries/da/academic_degrees.txt +1 -0
- package/data/libpostal/dictionaries/da/ambiguous_expansions.txt +7 -0
- package/data/libpostal/dictionaries/da/building_types.txt +3 -0
- package/data/libpostal/dictionaries/da/concatenated_suffixes_inseparable.txt +21 -0
- package/data/libpostal/dictionaries/da/concatenated_suffixes_separable.txt +9 -0
- package/data/libpostal/dictionaries/da/cross_streets.txt +5 -0
- package/data/libpostal/dictionaries/da/directionals.txt +13 -0
- package/data/libpostal/dictionaries/da/entrances.txt +1 -0
- package/data/libpostal/dictionaries/da/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/da/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/da/level_types_standalone.txt +2 -0
- package/data/libpostal/dictionaries/da/near.txt +14 -0
- package/data/libpostal/dictionaries/da/number.txt +1 -0
- package/data/libpostal/dictionaries/da/personal_titles.txt +1 -0
- package/data/libpostal/dictionaries/da/place_names.txt +7 -0
- package/data/libpostal/dictionaries/da/post_office.txt +2 -0
- package/data/libpostal/dictionaries/da/staircases.txt +2 -0
- package/data/libpostal/dictionaries/da/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/da/street_types.txt +38 -0
- package/data/libpostal/dictionaries/da/synonyms.txt +2 -0
- package/data/libpostal/dictionaries/da/unit_directions.txt +3 -0
- package/data/libpostal/dictionaries/da/unit_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/de/academic_degrees.txt +5 -0
- package/data/libpostal/dictionaries/de/ambiguous_expansions.txt +18 -0
- package/data/libpostal/dictionaries/de/chains.txt +11 -0
- package/data/libpostal/dictionaries/de/company_types.txt +8 -0
- package/data/libpostal/dictionaries/de/concatenated_prefixes_separable.txt +17 -0
- package/data/libpostal/dictionaries/de/concatenated_suffixes_inseparable.txt +5 -0
- package/data/libpostal/dictionaries/de/concatenated_suffixes_separable.txt +16 -0
- package/data/libpostal/dictionaries/de/cross_streets.txt +5 -0
- package/data/libpostal/dictionaries/de/directionals.txt +41 -0
- package/data/libpostal/dictionaries/de/entrances.txt +1 -0
- package/data/libpostal/dictionaries/de/house_numbers.txt +1 -0
- package/data/libpostal/dictionaries/de/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/de/level_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/de/level_types_standalone.txt +4 -0
- package/data/libpostal/dictionaries/de/near.txt +16 -0
- package/data/libpostal/dictionaries/de/number.txt +1 -0
- package/data/libpostal/dictionaries/de/personal_suffixes.txt +2 -0
- package/data/libpostal/dictionaries/de/personal_titles.txt +18 -0
- package/data/libpostal/dictionaries/de/place_names.txt +123 -0
- package/data/libpostal/dictionaries/de/post_office.txt +1 -0
- package/data/libpostal/dictionaries/de/qualifiers.txt +3 -0
- package/data/libpostal/dictionaries/de/staircases.txt +2 -0
- package/data/libpostal/dictionaries/de/stopwords.txt +39 -0
- package/data/libpostal/dictionaries/de/street_types.txt +36 -0
- package/data/libpostal/dictionaries/de/synonyms.txt +16 -0
- package/data/libpostal/dictionaries/de/toponyms.txt +28 -0
- package/data/libpostal/dictionaries/de/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/de/unit_types_numbered.txt +7 -0
- package/data/libpostal/dictionaries/el/ambiguous_expansions.txt +1 -0
- package/data/libpostal/dictionaries/el/building_types.txt +2 -0
- package/data/libpostal/dictionaries/el/entrances.txt +2 -0
- package/data/libpostal/dictionaries/el/given_names.txt +6 -0
- package/data/libpostal/dictionaries/el/level_types_basement.txt +2 -0
- package/data/libpostal/dictionaries/el/level_types_mezzanine.txt +2 -0
- package/data/libpostal/dictionaries/el/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/el/level_types_standalone.txt +2 -0
- package/data/libpostal/dictionaries/el/personal_titles.txt +12 -0
- package/data/libpostal/dictionaries/el/place_names.txt +18 -0
- package/data/libpostal/dictionaries/el/post_office.txt +2 -0
- package/data/libpostal/dictionaries/el/postcodes.txt +2 -0
- package/data/libpostal/dictionaries/el/qualifiers.txt +6 -0
- package/data/libpostal/dictionaries/el/staircases.txt +2 -0
- package/data/libpostal/dictionaries/el/street_types.txt +6 -0
- package/data/libpostal/dictionaries/el/synonyms.txt +41 -0
- package/data/libpostal/dictionaries/el/toponyms.txt +3 -0
- package/data/libpostal/dictionaries/el/unit_types_numbered.txt +6 -0
- package/data/libpostal/dictionaries/en/academic_degrees.txt +27 -0
- package/data/libpostal/dictionaries/en/ambiguous_expansions.txt +178 -0
- package/data/libpostal/dictionaries/en/building_types.txt +19 -0
- package/data/libpostal/dictionaries/en/chains.txt +6 -0
- package/data/libpostal/dictionaries/en/company_types.txt +61 -0
- package/data/libpostal/dictionaries/en/cross_streets.txt +9 -0
- package/data/libpostal/dictionaries/en/directionals.txt +20 -0
- package/data/libpostal/dictionaries/en/entrances.txt +1 -0
- package/data/libpostal/dictionaries/en/given_names.txt +2 -0
- package/data/libpostal/dictionaries/en/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/en/level_types_mezzanine.txt +5 -0
- package/data/libpostal/dictionaries/en/level_types_numbered.txt +4 -0
- package/data/libpostal/dictionaries/en/level_types_standalone.txt +12 -0
- package/data/libpostal/dictionaries/en/level_types_sub_basement.txt +1 -0
- package/data/libpostal/dictionaries/en/near.txt +7 -0
- package/data/libpostal/dictionaries/en/no_number.txt +1 -0
- package/data/libpostal/dictionaries/en/nulls.txt +2 -0
- package/data/libpostal/dictionaries/en/number.txt +1 -0
- package/data/libpostal/dictionaries/en/personal_suffixes.txt +2 -0
- package/data/libpostal/dictionaries/en/personal_titles.txt +80 -0
- package/data/libpostal/dictionaries/en/place_names.txt +315 -0
- package/data/libpostal/dictionaries/en/post_office.txt +16 -0
- package/data/libpostal/dictionaries/en/qualifiers.txt +5 -0
- package/data/libpostal/dictionaries/en/staircases.txt +3 -0
- package/data/libpostal/dictionaries/en/stopwords.txt +14 -0
- package/data/libpostal/dictionaries/en/street_names.txt +358 -0
- package/data/libpostal/dictionaries/en/street_types.txt +410 -0
- package/data/libpostal/dictionaries/en/synonyms.txt +53 -0
- package/data/libpostal/dictionaries/en/toponyms.txt +80 -0
- package/data/libpostal/dictionaries/en/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/en/unit_types_numbered.txt +69 -0
- package/data/libpostal/dictionaries/en/unit_types_standalone.txt +16 -0
- package/data/libpostal/dictionaries/es/academic_degrees.txt +2 -0
- package/data/libpostal/dictionaries/es/ambiguous_expansions.txt +45 -0
- package/data/libpostal/dictionaries/es/building_types.txt +15 -0
- package/data/libpostal/dictionaries/es/company_types.txt +49 -0
- package/data/libpostal/dictionaries/es/cross_streets.txt +9 -0
- package/data/libpostal/dictionaries/es/directionals.txt +13 -0
- package/data/libpostal/dictionaries/es/entrances.txt +3 -0
- package/data/libpostal/dictionaries/es/given_names.txt +3 -0
- package/data/libpostal/dictionaries/es/house_numbers.txt +2 -0
- package/data/libpostal/dictionaries/es/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/es/level_types_mezzanine.txt +1 -0
- package/data/libpostal/dictionaries/es/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/es/level_types_standalone.txt +7 -0
- package/data/libpostal/dictionaries/es/level_types_sub_basement.txt +1 -0
- package/data/libpostal/dictionaries/es/near.txt +10 -0
- package/data/libpostal/dictionaries/es/no_number.txt +1 -0
- package/data/libpostal/dictionaries/es/number.txt +1 -0
- package/data/libpostal/dictionaries/es/personal_suffixes.txt +1 -0
- package/data/libpostal/dictionaries/es/personal_titles.txt +132 -0
- package/data/libpostal/dictionaries/es/place_names.txt +234 -0
- package/data/libpostal/dictionaries/es/post_office.txt +4 -0
- package/data/libpostal/dictionaries/es/postcodes.txt +1 -0
- package/data/libpostal/dictionaries/es/qualifiers.txt +34 -0
- package/data/libpostal/dictionaries/es/staircases.txt +2 -0
- package/data/libpostal/dictionaries/es/stopwords.txt +29 -0
- package/data/libpostal/dictionaries/es/street_types.txt +109 -0
- package/data/libpostal/dictionaries/es/surnames.txt +6 -0
- package/data/libpostal/dictionaries/es/synonyms.txt +58 -0
- package/data/libpostal/dictionaries/es/toponyms.txt +39 -0
- package/data/libpostal/dictionaries/es/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/es/unit_types_numbered.txt +15 -0
- package/data/libpostal/dictionaries/es/unit_types_standalone.txt +5 -0
- package/data/libpostal/dictionaries/et/ambiguous_expansions.txt +5 -0
- package/data/libpostal/dictionaries/et/building_types.txt +3 -0
- package/data/libpostal/dictionaries/et/company_types.txt +10 -0
- package/data/libpostal/dictionaries/et/cross_streets.txt +4 -0
- package/data/libpostal/dictionaries/et/directionals.txt +9 -0
- package/data/libpostal/dictionaries/et/entrances.txt +1 -0
- package/data/libpostal/dictionaries/et/level_types_basement.txt +2 -0
- package/data/libpostal/dictionaries/et/level_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/et/near.txt +4 -0
- package/data/libpostal/dictionaries/et/number.txt +1 -0
- package/data/libpostal/dictionaries/et/personal_titles.txt +13 -0
- package/data/libpostal/dictionaries/et/place_names.txt +39 -0
- package/data/libpostal/dictionaries/et/post_office.txt +2 -0
- package/data/libpostal/dictionaries/et/qualifiers.txt +6 -0
- package/data/libpostal/dictionaries/et/staircases.txt +1 -0
- package/data/libpostal/dictionaries/et/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/et/street_types.txt +10 -0
- package/data/libpostal/dictionaries/et/toponyms.txt +1 -0
- package/data/libpostal/dictionaries/et/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/et/unit_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/eu/ambiguous_expansions.txt +2 -0
- package/data/libpostal/dictionaries/eu/cross_streets.txt +4 -0
- package/data/libpostal/dictionaries/eu/entrances.txt +1 -0
- package/data/libpostal/dictionaries/eu/level_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/eu/level_types_standalone.txt +2 -0
- package/data/libpostal/dictionaries/eu/near.txt +5 -0
- package/data/libpostal/dictionaries/eu/no_number.txt +1 -0
- package/data/libpostal/dictionaries/eu/place_names.txt +63 -0
- package/data/libpostal/dictionaries/eu/post_office.txt +1 -0
- package/data/libpostal/dictionaries/eu/postcodes.txt +1 -0
- package/data/libpostal/dictionaries/eu/qualifiers.txt +2 -0
- package/data/libpostal/dictionaries/eu/staircases.txt +1 -0
- package/data/libpostal/dictionaries/eu/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/eu/street_types.txt +18 -0
- package/data/libpostal/dictionaries/eu/unit_directions.txt +3 -0
- package/data/libpostal/dictionaries/eu/unit_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/fa/personal_titles.txt +6 -0
- package/data/libpostal/dictionaries/fa/place_names.txt +3 -0
- package/data/libpostal/dictionaries/fa/street_types.txt +7 -0
- package/data/libpostal/dictionaries/fi/ambiguous_expansions.txt +5 -0
- package/data/libpostal/dictionaries/fi/building_types.txt +3 -0
- package/data/libpostal/dictionaries/fi/chains.txt +1 -0
- package/data/libpostal/dictionaries/fi/concatenated_suffixes_separable.txt +20 -0
- package/data/libpostal/dictionaries/fi/cross_streets.txt +3 -0
- package/data/libpostal/dictionaries/fi/directionals.txt +4 -0
- package/data/libpostal/dictionaries/fi/entrances.txt +1 -0
- package/data/libpostal/dictionaries/fi/level_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/fi/near.txt +5 -0
- package/data/libpostal/dictionaries/fi/number.txt +1 -0
- package/data/libpostal/dictionaries/fi/post_office.txt +1 -0
- package/data/libpostal/dictionaries/fi/qualifiers.txt +2 -0
- package/data/libpostal/dictionaries/fi/staircases.txt +1 -0
- package/data/libpostal/dictionaries/fi/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/fi/street_types.txt +20 -0
- package/data/libpostal/dictionaries/fi/synonyms.txt +1 -0
- package/data/libpostal/dictionaries/fi/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/fi/unit_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/fil/street_types.txt +3 -0
- package/data/libpostal/dictionaries/fr/ambiguous_expansions.txt +25 -0
- package/data/libpostal/dictionaries/fr/building_types.txt +4 -0
- package/data/libpostal/dictionaries/fr/chains.txt +2 -0
- package/data/libpostal/dictionaries/fr/company_types.txt +40 -0
- package/data/libpostal/dictionaries/fr/cross_streets.txt +5 -0
- package/data/libpostal/dictionaries/fr/directionals.txt +12 -0
- package/data/libpostal/dictionaries/fr/elisions.txt +9 -0
- package/data/libpostal/dictionaries/fr/entrances.txt +2 -0
- package/data/libpostal/dictionaries/fr/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/fr/level_types_mezzanine.txt +1 -0
- package/data/libpostal/dictionaries/fr/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/fr/level_types_standalone.txt +8 -0
- package/data/libpostal/dictionaries/fr/level_types_sub_basement.txt +1 -0
- package/data/libpostal/dictionaries/fr/near.txt +20 -0
- package/data/libpostal/dictionaries/fr/no_number.txt +1 -0
- package/data/libpostal/dictionaries/fr/number.txt +1 -0
- package/data/libpostal/dictionaries/fr/people.txt +1 -0
- package/data/libpostal/dictionaries/fr/personal_titles.txt +57 -0
- package/data/libpostal/dictionaries/fr/place_names.txt +147 -0
- package/data/libpostal/dictionaries/fr/post_office.txt +3 -0
- package/data/libpostal/dictionaries/fr/qualifiers.txt +19 -0
- package/data/libpostal/dictionaries/fr/staircases.txt +1 -0
- package/data/libpostal/dictionaries/fr/stopwords.txt +28 -0
- package/data/libpostal/dictionaries/fr/street_types.txt +165 -0
- package/data/libpostal/dictionaries/fr/synonyms.txt +14 -0
- package/data/libpostal/dictionaries/fr/toponyms.txt +13 -0
- package/data/libpostal/dictionaries/fr/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/fr/unit_types_numbered.txt +10 -0
- package/data/libpostal/dictionaries/ga/building_types.txt +16 -0
- package/data/libpostal/dictionaries/ga/level_types_standalone.txt +1 -0
- package/data/libpostal/dictionaries/ga/personal_titles.txt +1 -0
- package/data/libpostal/dictionaries/ga/place_names.txt +10 -0
- package/data/libpostal/dictionaries/ga/street_types.txt +95 -0
- package/data/libpostal/dictionaries/ga/unit_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/gd/building_types.txt +8 -0
- package/data/libpostal/dictionaries/gd/directionals.txt +6 -0
- package/data/libpostal/dictionaries/gd/place_names.txt +7 -0
- package/data/libpostal/dictionaries/gd/qualifiers.txt +1 -0
- package/data/libpostal/dictionaries/gd/stopwords.txt +2 -0
- package/data/libpostal/dictionaries/gd/street_types.txt +52 -0
- package/data/libpostal/dictionaries/gl/ambiguous_expansions.txt +6 -0
- package/data/libpostal/dictionaries/gl/directionals.txt +8 -0
- package/data/libpostal/dictionaries/gl/personal_titles.txt +2 -0
- package/data/libpostal/dictionaries/gl/stopwords.txt +39 -0
- package/data/libpostal/dictionaries/gl/street_types.txt +26 -0
- package/data/libpostal/dictionaries/gl/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/gsw/ambiguous_expansions.txt +1 -0
- package/data/libpostal/dictionaries/gsw/concatenated_suffixes_separable.txt +8 -0
- package/data/libpostal/dictionaries/gsw/street_types.txt +8 -0
- package/data/libpostal/dictionaries/he/entrances.txt +2 -0
- package/data/libpostal/dictionaries/he/level_types_basement.txt +2 -0
- package/data/libpostal/dictionaries/he/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/he/level_types_standalone.txt +2 -0
- package/data/libpostal/dictionaries/he/personal_titles.txt +2 -0
- package/data/libpostal/dictionaries/he/post_office.txt +2 -0
- package/data/libpostal/dictionaries/he/street_types.txt +8 -0
- package/data/libpostal/dictionaries/he/unit_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/hi/street_types.txt +3 -0
- package/data/libpostal/dictionaries/hr/ambiguous_expansions.txt +6 -0
- package/data/libpostal/dictionaries/hr/building_types.txt +1 -0
- package/data/libpostal/dictionaries/hr/cross_streets.txt +6 -0
- package/data/libpostal/dictionaries/hr/directionals.txt +4 -0
- package/data/libpostal/dictionaries/hr/entrances.txt +1 -0
- package/data/libpostal/dictionaries/hr/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/hr/level_types_mezzanine.txt +1 -0
- package/data/libpostal/dictionaries/hr/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/hr/level_types_standalone.txt +2 -0
- package/data/libpostal/dictionaries/hr/near.txt +5 -0
- package/data/libpostal/dictionaries/hr/no_number.txt +1 -0
- package/data/libpostal/dictionaries/hr/personal_titles.txt +6 -0
- package/data/libpostal/dictionaries/hr/place_names.txt +18 -0
- package/data/libpostal/dictionaries/hr/post_office.txt +1 -0
- package/data/libpostal/dictionaries/hr/qualifiers.txt +1 -0
- package/data/libpostal/dictionaries/hr/staircases.txt +1 -0
- package/data/libpostal/dictionaries/hr/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/hr/street_types.txt +12 -0
- package/data/libpostal/dictionaries/hr/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/hr/unit_types_numbered.txt +4 -0
- package/data/libpostal/dictionaries/hu/ambiguous_expansions.txt +6 -0
- package/data/libpostal/dictionaries/hu/cross_streets.txt +5 -0
- package/data/libpostal/dictionaries/hu/directionals.txt +8 -0
- package/data/libpostal/dictionaries/hu/level_types_basement.txt +4 -0
- package/data/libpostal/dictionaries/hu/level_types_mezzanine.txt +2 -0
- package/data/libpostal/dictionaries/hu/level_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/hu/level_types_standalone.txt +1 -0
- package/data/libpostal/dictionaries/hu/near.txt +3 -0
- package/data/libpostal/dictionaries/hu/number.txt +1 -0
- package/data/libpostal/dictionaries/hu/personal_titles.txt +1 -0
- package/data/libpostal/dictionaries/hu/post_office.txt +1 -0
- package/data/libpostal/dictionaries/hu/stopwords.txt +4 -0
- package/data/libpostal/dictionaries/hu/street_types.txt +21 -0
- package/data/libpostal/dictionaries/hu/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/hu/unit_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/id/academic_degrees.txt +78 -0
- package/data/libpostal/dictionaries/id/ambiguous_expansions.txt +64 -0
- package/data/libpostal/dictionaries/id/building_types.txt +7 -0
- package/data/libpostal/dictionaries/id/chains.txt +5 -0
- package/data/libpostal/dictionaries/id/company_types.txt +15 -0
- package/data/libpostal/dictionaries/id/cross_streets.txt +6 -0
- package/data/libpostal/dictionaries/id/directionals.txt +9 -0
- package/data/libpostal/dictionaries/id/entrances.txt +3 -0
- package/data/libpostal/dictionaries/id/level_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/id/level_types_standalone.txt +3 -0
- package/data/libpostal/dictionaries/id/near.txt +3 -0
- package/data/libpostal/dictionaries/id/number.txt +1 -0
- package/data/libpostal/dictionaries/id/personal_titles.txt +34 -0
- package/data/libpostal/dictionaries/id/place_names.txt +145 -0
- package/data/libpostal/dictionaries/id/qualifiers.txt +13 -0
- package/data/libpostal/dictionaries/id/stopwords.txt +9 -0
- package/data/libpostal/dictionaries/id/street_types.txt +7 -0
- package/data/libpostal/dictionaries/id/synonyms.txt +22 -0
- package/data/libpostal/dictionaries/id/toponyms.txt +34 -0
- package/data/libpostal/dictionaries/id/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/id/unit_types_numbered.txt +16 -0
- package/data/libpostal/dictionaries/id/unit_types_standalone.txt +9 -0
- package/data/libpostal/dictionaries/is/ambiguous_expansions.txt +6 -0
- package/data/libpostal/dictionaries/is/concatenated_suffixes_inseparable.txt +29 -0
- package/data/libpostal/dictionaries/is/cross_streets.txt +4 -0
- package/data/libpostal/dictionaries/is/directionals.txt +4 -0
- package/data/libpostal/dictionaries/is/entrances.txt +1 -0
- package/data/libpostal/dictionaries/is/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/is/level_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/is/level_types_standalone.txt +1 -0
- package/data/libpostal/dictionaries/is/near.txt +6 -0
- package/data/libpostal/dictionaries/is/number.txt +1 -0
- package/data/libpostal/dictionaries/is/post_office.txt +1 -0
- package/data/libpostal/dictionaries/is/qualifiers.txt +2 -0
- package/data/libpostal/dictionaries/is/staircases.txt +1 -0
- package/data/libpostal/dictionaries/is/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/is/street_types.txt +29 -0
- package/data/libpostal/dictionaries/is/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/is/unit_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/it/academic_degrees.txt +1 -0
- package/data/libpostal/dictionaries/it/ambiguous_expansions.txt +8 -0
- package/data/libpostal/dictionaries/it/building_types.txt +5 -0
- package/data/libpostal/dictionaries/it/chains.txt +5 -0
- package/data/libpostal/dictionaries/it/company_types.txt +16 -0
- package/data/libpostal/dictionaries/it/cross_streets.txt +7 -0
- package/data/libpostal/dictionaries/it/directionals.txt +11 -0
- package/data/libpostal/dictionaries/it/elisions.txt +4 -0
- package/data/libpostal/dictionaries/it/entrances.txt +1 -0
- package/data/libpostal/dictionaries/it/level_types_basement.txt +2 -0
- package/data/libpostal/dictionaries/it/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/it/level_types_standalone.txt +2 -0
- package/data/libpostal/dictionaries/it/near.txt +10 -0
- package/data/libpostal/dictionaries/it/no_number.txt +2 -0
- package/data/libpostal/dictionaries/it/number.txt +1 -0
- package/data/libpostal/dictionaries/it/personal_titles.txt +72 -0
- package/data/libpostal/dictionaries/it/place_names.txt +203 -0
- package/data/libpostal/dictionaries/it/post_office.txt +2 -0
- package/data/libpostal/dictionaries/it/qualifiers.txt +16 -0
- package/data/libpostal/dictionaries/it/staircases.txt +1 -0
- package/data/libpostal/dictionaries/it/stopwords.txt +47 -0
- package/data/libpostal/dictionaries/it/street_types.txt +151 -0
- package/data/libpostal/dictionaries/it/synonyms.txt +115 -0
- package/data/libpostal/dictionaries/it/toponyms.txt +110 -0
- package/data/libpostal/dictionaries/it/unit_types_numbered.txt +9 -0
- package/data/libpostal/dictionaries/ja/ambiguous_expansions.txt +5 -0
- package/data/libpostal/dictionaries/ja/building_types.txt +6 -0
- package/data/libpostal/dictionaries/ja/chains.txt +27 -0
- package/data/libpostal/dictionaries/ja/directionals.txt +16 -0
- package/data/libpostal/dictionaries/ja/level_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/ja/number.txt +2 -0
- package/data/libpostal/dictionaries/ja/place_names.txt +16 -0
- package/data/libpostal/dictionaries/ja/post_office.txt +2 -0
- package/data/libpostal/dictionaries/ja/postcodes.txt +2 -0
- package/data/libpostal/dictionaries/ja/qualifiers.txt +38 -0
- package/data/libpostal/dictionaries/ja/street_types.txt +67 -0
- package/data/libpostal/dictionaries/ka/ambiguous_expansions.txt +2 -0
- package/data/libpostal/dictionaries/ka/personal_titles.txt +4 -0
- package/data/libpostal/dictionaries/ka/place_names.txt +7 -0
- package/data/libpostal/dictionaries/ka/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/ka/street_types.txt +12 -0
- package/data/libpostal/dictionaries/ko/directionals.txt +31 -0
- package/data/libpostal/dictionaries/ko/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/ko/number.txt +3 -0
- package/data/libpostal/dictionaries/ko/post_office.txt +2 -0
- package/data/libpostal/dictionaries/ko/postcodes.txt +2 -0
- package/data/libpostal/dictionaries/ko/qualifiers.txt +6 -0
- package/data/libpostal/dictionaries/ko/street_types.txt +8 -0
- package/data/libpostal/dictionaries/lb/concatenated_suffixes_separable.txt +3 -0
- package/data/libpostal/dictionaries/lb/street_types.txt +3 -0
- package/data/libpostal/dictionaries/lt/ambiguous_expansions.txt +6 -0
- package/data/libpostal/dictionaries/lt/building_types.txt +1 -0
- package/data/libpostal/dictionaries/lt/cross_streets.txt +4 -0
- package/data/libpostal/dictionaries/lt/directionals.txt +4 -0
- package/data/libpostal/dictionaries/lt/entrances.txt +1 -0
- package/data/libpostal/dictionaries/lt/level_types_basement.txt +2 -0
- package/data/libpostal/dictionaries/lt/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/lt/level_types_standalone.txt +1 -0
- package/data/libpostal/dictionaries/lt/number.txt +1 -0
- package/data/libpostal/dictionaries/lt/post_office.txt +1 -0
- package/data/libpostal/dictionaries/lt/qualifiers.txt +5 -0
- package/data/libpostal/dictionaries/lt/staircases.txt +1 -0
- package/data/libpostal/dictionaries/lt/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/lt/street_types.txt +7 -0
- package/data/libpostal/dictionaries/lt/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/lt/unit_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/lv/ambiguous_expansions.txt +6 -0
- package/data/libpostal/dictionaries/lv/cross_streets.txt +5 -0
- package/data/libpostal/dictionaries/lv/directionals.txt +4 -0
- package/data/libpostal/dictionaries/lv/entrances.txt +1 -0
- package/data/libpostal/dictionaries/lv/level_types_basement.txt +2 -0
- package/data/libpostal/dictionaries/lv/level_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/lv/level_types_standalone.txt +1 -0
- package/data/libpostal/dictionaries/lv/number.txt +1 -0
- package/data/libpostal/dictionaries/lv/place_names.txt +2 -0
- package/data/libpostal/dictionaries/lv/staircases.txt +2 -0
- package/data/libpostal/dictionaries/lv/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/lv/street_types.txt +5 -0
- package/data/libpostal/dictionaries/lv/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/lv/unit_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/ms/ambiguous_expansions.txt +1 -0
- package/data/libpostal/dictionaries/ms/building_types.txt +10 -0
- package/data/libpostal/dictionaries/ms/company_types.txt +8 -0
- package/data/libpostal/dictionaries/ms/directionals.txt +9 -0
- package/data/libpostal/dictionaries/ms/given_names.txt +3 -0
- package/data/libpostal/dictionaries/ms/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/ms/personal_titles.txt +92 -0
- package/data/libpostal/dictionaries/ms/place_names.txt +145 -0
- package/data/libpostal/dictionaries/ms/post_office.txt +3 -0
- package/data/libpostal/dictionaries/ms/qualifiers.txt +6 -0
- package/data/libpostal/dictionaries/ms/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/ms/street_types.txt +35 -0
- package/data/libpostal/dictionaries/ms/synonyms.txt +27 -0
- package/data/libpostal/dictionaries/mt/ambiguous_expansions.txt +1 -0
- package/data/libpostal/dictionaries/mt/number.txt +1 -0
- package/data/libpostal/dictionaries/mt/personal_titles.txt +6 -0
- package/data/libpostal/dictionaries/mt/place_names.txt +1 -0
- package/data/libpostal/dictionaries/mt/stopwords.txt +5 -0
- package/data/libpostal/dictionaries/mt/street_types.txt +6 -0
- package/data/libpostal/dictionaries/nb/ambiguous_expansions.txt +11 -0
- package/data/libpostal/dictionaries/nb/building_types.txt +3 -0
- package/data/libpostal/dictionaries/nb/concatenated_suffixes_inseparable.txt +13 -0
- package/data/libpostal/dictionaries/nb/concatenated_suffixes_separable.txt +6 -0
- package/data/libpostal/dictionaries/nb/cross_streets.txt +5 -0
- package/data/libpostal/dictionaries/nb/directionals.txt +13 -0
- package/data/libpostal/dictionaries/nb/entrances.txt +1 -0
- package/data/libpostal/dictionaries/nb/level_types_numbered.txt +5 -0
- package/data/libpostal/dictionaries/nb/near.txt +7 -0
- package/data/libpostal/dictionaries/nb/number.txt +1 -0
- package/data/libpostal/dictionaries/nb/personal_titles.txt +1 -0
- package/data/libpostal/dictionaries/nb/post_office.txt +1 -0
- package/data/libpostal/dictionaries/nb/staircases.txt +2 -0
- package/data/libpostal/dictionaries/nb/stopwords.txt +34 -0
- package/data/libpostal/dictionaries/nb/street_types.txt +20 -0
- package/data/libpostal/dictionaries/nb/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/nb/unit_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/nl/ambiguous_expansions.txt +10 -0
- package/data/libpostal/dictionaries/nl/building_types.txt +1 -0
- package/data/libpostal/dictionaries/nl/chains.txt +1 -0
- package/data/libpostal/dictionaries/nl/concatenated_suffixes_inseparable.txt +3 -0
- package/data/libpostal/dictionaries/nl/concatenated_suffixes_separable.txt +13 -0
- package/data/libpostal/dictionaries/nl/cross_streets.txt +4 -0
- package/data/libpostal/dictionaries/nl/directionals.txt +20 -0
- package/data/libpostal/dictionaries/nl/entrances.txt +1 -0
- package/data/libpostal/dictionaries/nl/level_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/nl/level_types_standalone.txt +5 -0
- package/data/libpostal/dictionaries/nl/near.txt +7 -0
- package/data/libpostal/dictionaries/nl/number.txt +1 -0
- package/data/libpostal/dictionaries/nl/personal_titles.txt +32 -0
- package/data/libpostal/dictionaries/nl/place_names.txt +81 -0
- package/data/libpostal/dictionaries/nl/post_office.txt +1 -0
- package/data/libpostal/dictionaries/nl/qualifiers.txt +4 -0
- package/data/libpostal/dictionaries/nl/staircases.txt +2 -0
- package/data/libpostal/dictionaries/nl/stopwords.txt +38 -0
- package/data/libpostal/dictionaries/nl/street_types.txt +22 -0
- package/data/libpostal/dictionaries/nl/synonyms.txt +2 -0
- package/data/libpostal/dictionaries/nl/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/nl/unit_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/oc/elisions.txt +1 -0
- package/data/libpostal/dictionaries/oc/stopwords.txt +14 -0
- package/data/libpostal/dictionaries/oc/street_types.txt +5 -0
- package/data/libpostal/dictionaries/pap/personal_titles.txt +2 -0
- package/data/libpostal/dictionaries/pap/street_types.txt +2 -0
- package/data/libpostal/dictionaries/pl/academic_degrees.txt +2 -0
- package/data/libpostal/dictionaries/pl/ambiguous_expansions.txt +9 -0
- package/data/libpostal/dictionaries/pl/building_types.txt +1 -0
- package/data/libpostal/dictionaries/pl/chains.txt +3 -0
- package/data/libpostal/dictionaries/pl/company_types.txt +4 -0
- package/data/libpostal/dictionaries/pl/cross_streets.txt +6 -0
- package/data/libpostal/dictionaries/pl/directionals.txt +8 -0
- package/data/libpostal/dictionaries/pl/entrances.txt +1 -0
- package/data/libpostal/dictionaries/pl/house_numbers.txt +1 -0
- package/data/libpostal/dictionaries/pl/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/pl/level_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/pl/level_types_standalone.txt +1 -0
- package/data/libpostal/dictionaries/pl/near.txt +11 -0
- package/data/libpostal/dictionaries/pl/number.txt +1 -0
- package/data/libpostal/dictionaries/pl/personal_suffixes.txt +2 -0
- package/data/libpostal/dictionaries/pl/personal_titles.txt +54 -0
- package/data/libpostal/dictionaries/pl/place_names.txt +31 -0
- package/data/libpostal/dictionaries/pl/post_office.txt +1 -0
- package/data/libpostal/dictionaries/pl/qualifiers.txt +9 -0
- package/data/libpostal/dictionaries/pl/staircases.txt +1 -0
- package/data/libpostal/dictionaries/pl/stopwords.txt +3 -0
- package/data/libpostal/dictionaries/pl/street_types.txt +12 -0
- package/data/libpostal/dictionaries/pl/synonyms.txt +19 -0
- package/data/libpostal/dictionaries/pl/toponyms.txt +1 -0
- package/data/libpostal/dictionaries/pl/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/pl/unit_types_numbered.txt +2 -0
- package/data/libpostal/dictionaries/pt/ambiguous_expansions.txt +12 -0
- package/data/libpostal/dictionaries/pt/building_types.txt +7 -0
- package/data/libpostal/dictionaries/pt/company_types.txt +31 -0
- package/data/libpostal/dictionaries/pt/cross_streets.txt +8 -0
- package/data/libpostal/dictionaries/pt/directionals.txt +8 -0
- package/data/libpostal/dictionaries/pt/elisions.txt +1 -0
- package/data/libpostal/dictionaries/pt/entrances.txt +1 -0
- package/data/libpostal/dictionaries/pt/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/pt/level_types_mezzanine.txt +1 -0
- package/data/libpostal/dictionaries/pt/level_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/pt/level_types_standalone.txt +5 -0
- package/data/libpostal/dictionaries/pt/level_types_sub_basement.txt +1 -0
- package/data/libpostal/dictionaries/pt/near.txt +13 -0
- package/data/libpostal/dictionaries/pt/no_number.txt +1 -0
- package/data/libpostal/dictionaries/pt/number.txt +1 -0
- package/data/libpostal/dictionaries/pt/personal_suffixes.txt +3 -0
- package/data/libpostal/dictionaries/pt/personal_titles.txt +101 -0
- package/data/libpostal/dictionaries/pt/place_names.txt +52 -0
- package/data/libpostal/dictionaries/pt/post_office.txt +2 -0
- package/data/libpostal/dictionaries/pt/postcodes.txt +2 -0
- package/data/libpostal/dictionaries/pt/qualifiers.txt +8 -0
- package/data/libpostal/dictionaries/pt/staircases.txt +1 -0
- package/data/libpostal/dictionaries/pt/stopwords.txt +35 -0
- package/data/libpostal/dictionaries/pt/street_types.txt +53 -0
- package/data/libpostal/dictionaries/pt/synonyms.txt +21 -0
- package/data/libpostal/dictionaries/pt/toponyms.txt +28 -0
- package/data/libpostal/dictionaries/pt/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/pt/unit_types_numbered.txt +10 -0
- package/data/libpostal/dictionaries/pt/unit_types_standalone.txt +1 -0
- package/data/libpostal/dictionaries/ro/ambiguous_expansions.txt +5 -0
- package/data/libpostal/dictionaries/ro/cross_streets.txt +5 -0
- package/data/libpostal/dictionaries/ro/directionals.txt +4 -0
- package/data/libpostal/dictionaries/ro/entrances.txt +1 -0
- package/data/libpostal/dictionaries/ro/level_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/ro/level_types_standalone.txt +1 -0
- package/data/libpostal/dictionaries/ro/near.txt +7 -0
- package/data/libpostal/dictionaries/ro/no_number.txt +1 -0
- package/data/libpostal/dictionaries/ro/number.txt +1 -0
- package/data/libpostal/dictionaries/ro/personal_titles.txt +14 -0
- package/data/libpostal/dictionaries/ro/post_office.txt +1 -0
- package/data/libpostal/dictionaries/ro/qualifiers.txt +1 -0
- package/data/libpostal/dictionaries/ro/staircases.txt +1 -0
- package/data/libpostal/dictionaries/ro/stopwords.txt +2 -0
- package/data/libpostal/dictionaries/ro/street_types.txt +13 -0
- package/data/libpostal/dictionaries/ro/unit_types_numbered.txt +4 -0
- package/data/libpostal/dictionaries/ru/ambiguous_expansions.txt +18 -0
- package/data/libpostal/dictionaries/ru/building_types.txt +2 -0
- package/data/libpostal/dictionaries/ru/chains.txt +42 -0
- package/data/libpostal/dictionaries/ru/company_types.txt +9 -0
- package/data/libpostal/dictionaries/ru/cross_streets.txt +11 -0
- package/data/libpostal/dictionaries/ru/directionals.txt +16 -0
- package/data/libpostal/dictionaries/ru/entrances.txt +2 -0
- package/data/libpostal/dictionaries/ru/house_numbers.txt +2 -0
- package/data/libpostal/dictionaries/ru/level_types_basement.txt +4 -0
- package/data/libpostal/dictionaries/ru/level_types_numbered.txt +4 -0
- package/data/libpostal/dictionaries/ru/level_types_standalone.txt +4 -0
- package/data/libpostal/dictionaries/ru/near.txt +26 -0
- package/data/libpostal/dictionaries/ru/no_number.txt +1 -0
- package/data/libpostal/dictionaries/ru/number.txt +2 -0
- package/data/libpostal/dictionaries/ru/personal_titles.txt +6 -0
- package/data/libpostal/dictionaries/ru/place_names.txt +160 -0
- package/data/libpostal/dictionaries/ru/post_office.txt +2 -0
- package/data/libpostal/dictionaries/ru/qualifiers.txt +31 -0
- package/data/libpostal/dictionaries/ru/staircases.txt +2 -0
- package/data/libpostal/dictionaries/ru/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/ru/street_types.txt +28 -0
- package/data/libpostal/dictionaries/ru/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/ru/unit_types_numbered.txt +10 -0
- package/data/libpostal/dictionaries/si/place_names.txt +8 -0
- package/data/libpostal/dictionaries/si/qualifiers.txt +4 -0
- package/data/libpostal/dictionaries/si/street_types.txt +2 -0
- package/data/libpostal/dictionaries/sk/ambiguous_expansions.txt +6 -0
- package/data/libpostal/dictionaries/sk/cross_streets.txt +8 -0
- package/data/libpostal/dictionaries/sk/directionals.txt +21 -0
- package/data/libpostal/dictionaries/sk/entrances.txt +1 -0
- package/data/libpostal/dictionaries/sk/house_numbers.txt +1 -0
- package/data/libpostal/dictionaries/sk/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/sk/level_types_numbered.txt +4 -0
- package/data/libpostal/dictionaries/sk/level_types_standalone.txt +1 -0
- package/data/libpostal/dictionaries/sk/near.txt +13 -0
- package/data/libpostal/dictionaries/sk/number.txt +1 -0
- package/data/libpostal/dictionaries/sk/personal_titles.txt +16 -0
- package/data/libpostal/dictionaries/sk/place_names.txt +28 -0
- package/data/libpostal/dictionaries/sk/post_office.txt +1 -0
- package/data/libpostal/dictionaries/sk/qualifiers.txt +3 -0
- package/data/libpostal/dictionaries/sk/staircases.txt +1 -0
- package/data/libpostal/dictionaries/sk/stopwords.txt +29 -0
- package/data/libpostal/dictionaries/sk/street_types.txt +20 -0
- package/data/libpostal/dictionaries/sk/toponyms.txt +1 -0
- package/data/libpostal/dictionaries/sk/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/sk/unit_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/sl/ambiguous_expansions.txt +6 -0
- package/data/libpostal/dictionaries/sl/chains.txt +1 -0
- package/data/libpostal/dictionaries/sl/cross_streets.txt +5 -0
- package/data/libpostal/dictionaries/sl/directionals.txt +4 -0
- package/data/libpostal/dictionaries/sl/entrances.txt +1 -0
- package/data/libpostal/dictionaries/sl/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/sl/level_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/sl/level_types_standalone.txt +2 -0
- package/data/libpostal/dictionaries/sl/near.txt +7 -0
- package/data/libpostal/dictionaries/sl/no_number.txt +1 -0
- package/data/libpostal/dictionaries/sl/number.txt +1 -0
- package/data/libpostal/dictionaries/sl/personal_titles.txt +3 -0
- package/data/libpostal/dictionaries/sl/place_names.txt +1 -0
- package/data/libpostal/dictionaries/sl/post_office.txt +1 -0
- package/data/libpostal/dictionaries/sl/staircases.txt +1 -0
- package/data/libpostal/dictionaries/sl/stopwords.txt +7 -0
- package/data/libpostal/dictionaries/sl/street_types.txt +4 -0
- package/data/libpostal/dictionaries/sl/synonyms.txt +13 -0
- package/data/libpostal/dictionaries/sl/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/sl/unit_types_numbered.txt +3 -0
- package/data/libpostal/dictionaries/sr/ambiguous_expansions.txt +9 -0
- package/data/libpostal/dictionaries/sr/cross_streets.txt +10 -0
- package/data/libpostal/dictionaries/sr/directionals.txt +8 -0
- package/data/libpostal/dictionaries/sr/entrances.txt +2 -0
- package/data/libpostal/dictionaries/sr/level_types_basement.txt +2 -0
- package/data/libpostal/dictionaries/sr/level_types_numbered.txt +6 -0
- package/data/libpostal/dictionaries/sr/level_types_standalone.txt +4 -0
- package/data/libpostal/dictionaries/sr/number.txt +2 -0
- package/data/libpostal/dictionaries/sr/personal_titles.txt +14 -0
- package/data/libpostal/dictionaries/sr/place_names.txt +12 -0
- package/data/libpostal/dictionaries/sr/post_office.txt +6 -0
- package/data/libpostal/dictionaries/sr/staircases.txt +2 -0
- package/data/libpostal/dictionaries/sr/stopwords.txt +2 -0
- package/data/libpostal/dictionaries/sr/street_types.txt +17 -0
- package/data/libpostal/dictionaries/sr/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/sr/unit_types_numbered.txt +8 -0
- package/data/libpostal/dictionaries/sv/ambiguous_expansions.txt +9 -0
- package/data/libpostal/dictionaries/sv/company_types.txt +4 -0
- package/data/libpostal/dictionaries/sv/concatenated_suffixes_inseparable.txt +5 -0
- package/data/libpostal/dictionaries/sv/concatenated_suffixes_separable.txt +8 -0
- package/data/libpostal/dictionaries/sv/cross_streets.txt +5 -0
- package/data/libpostal/dictionaries/sv/directionals.txt +8 -0
- package/data/libpostal/dictionaries/sv/entrances.txt +2 -0
- package/data/libpostal/dictionaries/sv/level_types_numbered.txt +7 -0
- package/data/libpostal/dictionaries/sv/level_types_standalone.txt +5 -0
- package/data/libpostal/dictionaries/sv/near.txt +11 -0
- package/data/libpostal/dictionaries/sv/number.txt +1 -0
- package/data/libpostal/dictionaries/sv/personal_titles.txt +3 -0
- package/data/libpostal/dictionaries/sv/post_office.txt +2 -0
- package/data/libpostal/dictionaries/sv/staircases.txt +3 -0
- package/data/libpostal/dictionaries/sv/stopwords.txt +25 -0
- package/data/libpostal/dictionaries/sv/street_types.txt +13 -0
- package/data/libpostal/dictionaries/sv/synonyms.txt +4 -0
- package/data/libpostal/dictionaries/sv/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/sv/unit_types_numbered.txt +5 -0
- package/data/libpostal/dictionaries/th/chains.txt +2 -0
- package/data/libpostal/dictionaries/th/street_types.txt +10 -0
- package/data/libpostal/dictionaries/tr/ambiguous_expansions.txt +5 -0
- package/data/libpostal/dictionaries/tr/chains.txt +1 -0
- package/data/libpostal/dictionaries/tr/cross_streets.txt +4 -0
- package/data/libpostal/dictionaries/tr/directionals.txt +4 -0
- package/data/libpostal/dictionaries/tr/entrances.txt +1 -0
- package/data/libpostal/dictionaries/tr/level_types_basement.txt +1 -0
- package/data/libpostal/dictionaries/tr/level_types_mezzanine.txt +1 -0
- package/data/libpostal/dictionaries/tr/level_types_numbered.txt +1 -0
- package/data/libpostal/dictionaries/tr/level_types_standalone.txt +1 -0
- package/data/libpostal/dictionaries/tr/number.txt +2 -0
- package/data/libpostal/dictionaries/tr/personal_titles.txt +4 -0
- package/data/libpostal/dictionaries/tr/place_names.txt +2 -0
- package/data/libpostal/dictionaries/tr/post_office.txt +1 -0
- package/data/libpostal/dictionaries/tr/qualifiers.txt +5 -0
- package/data/libpostal/dictionaries/tr/staircases.txt +1 -0
- package/data/libpostal/dictionaries/tr/stopwords.txt +1 -0
- package/data/libpostal/dictionaries/tr/street_types.txt +10 -0
- package/data/libpostal/dictionaries/tr/unit_directions.txt +2 -0
- package/data/libpostal/dictionaries/tr/unit_types_numbered.txt +4 -0
- package/data/libpostal/dictionaries/uk/ambiguous_expansions.txt +8 -0
- package/data/libpostal/dictionaries/uk/chains.txt +7 -0
- package/data/libpostal/dictionaries/uk/cross_streets.txt +10 -0
- package/data/libpostal/dictionaries/uk/directionals.txt +8 -0
- package/data/libpostal/dictionaries/uk/entrances.txt +2 -0
- package/data/libpostal/dictionaries/uk/house_numbers.txt +4 -0
- package/data/libpostal/dictionaries/uk/level_types_basement.txt +4 -0
- package/data/libpostal/dictionaries/uk/level_types_numbered.txt +4 -0
- package/data/libpostal/dictionaries/uk/level_types_standalone.txt +4 -0
- package/data/libpostal/dictionaries/uk/near.txt +24 -0
- package/data/libpostal/dictionaries/uk/number.txt +2 -0
- package/data/libpostal/dictionaries/uk/personal_titles.txt +9 -0
- package/data/libpostal/dictionaries/uk/place_names.txt +161 -0
- package/data/libpostal/dictionaries/uk/post_office.txt +2 -0
- package/data/libpostal/dictionaries/uk/qualifiers.txt +8 -0
- package/data/libpostal/dictionaries/uk/staircases.txt +2 -0
- package/data/libpostal/dictionaries/uk/stopwords.txt +2 -0
- package/data/libpostal/dictionaries/uk/street_types.txt +26 -0
- package/data/libpostal/dictionaries/uk/unit_directions.txt +4 -0
- package/data/libpostal/dictionaries/uk/unit_types_numbered.txt +10 -0
- package/data/libpostal/dictionaries/ur/street_types.txt +7 -0
- package/data/libpostal/dictionaries/vi/ambiguous_expansions.txt +3 -0
- package/data/libpostal/dictionaries/vi/personal_titles.txt +1 -0
- package/data/libpostal/dictionaries/vi/place_names.txt +29 -0
- package/data/libpostal/dictionaries/vi/qualifiers.txt +5 -0
- package/data/libpostal/dictionaries/vi/street_types.txt +10 -0
- package/data/libpostal/dictionaries/zh/building_types.txt +2 -0
- package/data/libpostal/dictionaries/zh/chains.txt +2 -0
- package/data/libpostal/dictionaries/zh/directionals.txt +20 -0
- package/data/libpostal/dictionaries/zh/level_types_numbered.txt +5 -0
- package/data/libpostal/dictionaries/zh/number.txt +3 -0
- package/data/libpostal/dictionaries/zh/place_names.txt +2 -0
- package/data/libpostal/dictionaries/zh/post_office.txt +3 -0
- package/data/libpostal/dictionaries/zh/postcodes.txt +3 -0
- package/data/libpostal/dictionaries/zh/qualifiers.txt +19 -0
- package/data/libpostal/dictionaries/zh/stopwords.txt +2 -0
- package/data/libpostal/dictionaries/zh/street_types.txt +30 -0
- package/data/libpostal/dictionaries/zh/unit_types_numbered.txt +2 -0
- package/data/libpostal/resources-download.sh +44 -0
- package/data/whosonfirst/dictionaries/country/name:eng_x_preferred.txt +220 -0
- package/data/whosonfirst/dictionaries/country/wof:country.txt +215 -0
- package/data/whosonfirst/dictionaries/country/wof:country_alpha3.txt +216 -0
- package/data/whosonfirst/dictionaries/dependency/name:eng_x_preferred.txt +42 -0
- package/data/whosonfirst/dictionaries/dependency/wof:shortcode.txt +34 -0
- package/data/whosonfirst/dictionaries/locality/name:eng_x_preferred.txt +261365 -0
- package/data/whosonfirst/dictionaries/locality/name:fra_x_preferred.txt +77631 -0
- package/data/whosonfirst/dictionaries/region/abrv:eng_x_preferred.txt +441 -0
- package/data/whosonfirst/dictionaries/region/name:eng_x_preferred.txt +4517 -0
- package/data/whosonfirst/dictionaries/region/wof:shortcode.txt +839 -0
- package/out/classification/BaseClassifier.d.ts +38 -0
- package/out/classification/BaseClassifier.d.ts.map +1 -0
- package/out/classification/BaseClassifier.js +12 -0
- package/out/classification/BaseClassifier.js.map +1 -0
- package/out/classification/Classification.d.ts +79 -0
- package/out/classification/Classification.d.ts.map +1 -0
- package/out/classification/Classification.js +133 -0
- package/out/classification/Classification.js.map +1 -0
- package/out/classification/CompositeClassifier.d.ts +16 -0
- package/out/classification/CompositeClassifier.d.ts.map +1 -0
- package/out/classification/CompositeClassifier.js +113 -0
- package/out/classification/CompositeClassifier.js.map +1 -0
- package/out/classification/PhraseClassifier.d.ts +23 -0
- package/out/classification/PhraseClassifier.d.ts.map +1 -0
- package/out/classification/PhraseClassifier.js +32 -0
- package/out/classification/PhraseClassifier.js.map +1 -0
- package/out/classification/SectionClassifier.d.ts +23 -0
- package/out/classification/SectionClassifier.d.ts.map +1 -0
- package/out/classification/SectionClassifier.js +27 -0
- package/out/classification/SectionClassifier.js.map +1 -0
- package/out/classification/WordClassifier.d.ts +22 -0
- package/out/classification/WordClassifier.d.ts.map +1 -0
- package/out/classification/WordClassifier.js +33 -0
- package/out/classification/WordClassifier.js.map +1 -0
- package/out/classification/index.d.ts +13 -0
- package/out/classification/index.d.ts.map +1 -0
- package/out/classification/index.js +13 -0
- package/out/classification/index.js.map +1 -0
- package/out/classification/scheme.d.ts +46 -0
- package/out/classification/scheme.d.ts.map +1 -0
- package/out/classification/scheme.js +37 -0
- package/out/classification/scheme.js.map +1 -0
- package/out/decoder/build-tree.d.ts +31 -0
- package/out/decoder/build-tree.d.ts.map +1 -0
- package/out/decoder/build-tree.js +100 -0
- package/out/decoder/build-tree.js.map +1 -0
- package/out/decoder/containment.d.ts +19 -0
- package/out/decoder/containment.d.ts.map +1 -0
- package/out/decoder/containment.js +47 -0
- package/out/decoder/containment.js.map +1 -0
- package/out/decoder/index.d.ts +13 -0
- package/out/decoder/index.d.ts.map +1 -0
- package/out/decoder/index.js +13 -0
- package/out/decoder/index.js.map +1 -0
- package/out/decoder/proposals-to-tree.d.ts +19 -0
- package/out/decoder/proposals-to-tree.d.ts.map +1 -0
- package/out/decoder/proposals-to-tree.js +28 -0
- package/out/decoder/proposals-to-tree.js.map +1 -0
- package/out/decoder/serialize-json.d.ts +15 -0
- package/out/decoder/serialize-json.d.ts.map +1 -0
- package/out/decoder/serialize-json.js +24 -0
- package/out/decoder/serialize-json.js.map +1 -0
- package/out/decoder/serialize-tuples.d.ts +16 -0
- package/out/decoder/serialize-tuples.d.ts.map +1 -0
- package/out/decoder/serialize-tuples.js +25 -0
- package/out/decoder/serialize-tuples.js.map +1 -0
- package/out/decoder/serialize-xml.d.ts +36 -0
- package/out/decoder/serialize-xml.d.ts.map +1 -0
- package/out/decoder/serialize-xml.js +60 -0
- package/out/decoder/serialize-xml.js.map +1 -0
- package/out/decoder/types.d.ts +71 -0
- package/out/decoder/types.d.ts.map +1 -0
- package/out/decoder/types.js +23 -0
- package/out/decoder/types.js.map +1 -0
- package/out/filters/InvalidSolutionFilter.d.ts +19 -0
- package/out/filters/InvalidSolutionFilter.d.ts.map +1 -0
- package/out/filters/InvalidSolutionFilter.js +29 -0
- package/out/filters/InvalidSolutionFilter.js.map +1 -0
- package/out/filters/RelationshipFilter.d.ts +14 -0
- package/out/filters/RelationshipFilter.d.ts.map +1 -0
- package/out/filters/RelationshipFilter.js +64 -0
- package/out/filters/RelationshipFilter.js.map +1 -0
- package/out/filters/SubsetFilter.d.ts +10 -0
- package/out/filters/SubsetFilter.d.ts.map +1 -0
- package/out/filters/SubsetFilter.js +26 -0
- package/out/filters/SubsetFilter.js.map +1 -0
- package/out/filters/TokenDistanceFilter.d.ts +10 -0
- package/out/filters/TokenDistanceFilter.d.ts.map +1 -0
- package/out/filters/TokenDistanceFilter.js +30 -0
- package/out/filters/TokenDistanceFilter.js.map +1 -0
- package/out/filters/index.d.ts +10 -0
- package/out/filters/index.d.ts.map +1 -0
- package/out/filters/index.js +10 -0
- package/out/filters/index.js.map +1 -0
- package/out/formatter/index.d.ts +11 -0
- package/out/formatter/index.d.ts.map +1 -0
- package/out/formatter/index.js +49 -0
- package/out/formatter/index.js.map +1 -0
- package/out/index.d.ts +14 -0
- package/out/index.d.ts.map +1 -0
- package/out/index.js +18 -0
- package/out/index.js.map +1 -0
- package/out/locale/index.d.ts +9 -0
- package/out/locale/index.d.ts.map +1 -0
- package/out/locale/index.js +9 -0
- package/out/locale/index.js.map +1 -0
- package/out/locale/locale.d.ts +43 -0
- package/out/locale/locale.d.ts.map +1 -0
- package/out/locale/locale.js +16 -0
- package/out/locale/locale.js.map +1 -0
- package/out/locale/profiles/en-us.d.ts +12 -0
- package/out/locale/profiles/en-us.d.ts.map +1 -0
- package/out/locale/profiles/en-us.js +67 -0
- package/out/locale/profiles/en-us.js.map +1 -0
- package/out/locale/profiles/fr-fr.d.ts +14 -0
- package/out/locale/profiles/fr-fr.d.ts.map +1 -0
- package/out/locale/profiles/fr-fr.js +73 -0
- package/out/locale/profiles/fr-fr.js.map +1 -0
- package/out/locale/profiles/index.d.ts +9 -0
- package/out/locale/profiles/index.d.ts.map +1 -0
- package/out/locale/profiles/index.js +9 -0
- package/out/locale/profiles/index.js.map +1 -0
- package/out/locale/profiles/ja-jp.d.ts +17 -0
- package/out/locale/profiles/ja-jp.d.ts.map +1 -0
- package/out/locale/profiles/ja-jp.js +31 -0
- package/out/locale/profiles/ja-jp.js.map +1 -0
- package/out/locale/registry.d.ts +20 -0
- package/out/locale/registry.d.ts.map +1 -0
- package/out/locale/registry.js +49 -0
- package/out/locale/registry.js.map +1 -0
- package/out/parser/AddressParser.d.ts +97 -0
- package/out/parser/AddressParser.d.ts.map +1 -0
- package/out/parser/AddressParser.js +116 -0
- package/out/parser/AddressParser.js.map +1 -0
- package/out/parser/index.d.ts +8 -0
- package/out/parser/index.d.ts.map +1 -0
- package/out/parser/index.js +8 -0
- package/out/parser/index.js.map +1 -0
- package/out/parser/proposal-pipeline.d.ts +67 -0
- package/out/parser/proposal-pipeline.d.ts.map +1 -0
- package/out/parser/proposal-pipeline.js +127 -0
- package/out/parser/proposal-pipeline.js.map +1 -0
- package/out/policy/defaults.d.ts +21 -0
- package/out/policy/defaults.d.ts.map +1 -0
- package/out/policy/defaults.js +27 -0
- package/out/policy/defaults.js.map +1 -0
- package/out/policy/index.d.ts +9 -0
- package/out/policy/index.d.ts.map +1 -0
- package/out/policy/index.js +9 -0
- package/out/policy/index.js.map +1 -0
- package/out/policy/policy.d.ts +57 -0
- package/out/policy/policy.d.ts.map +1 -0
- package/out/policy/policy.js +12 -0
- package/out/policy/policy.js.map +1 -0
- package/out/policy/registry.d.ts +31 -0
- package/out/policy/registry.d.ts.map +1 -0
- package/out/policy/registry.js +114 -0
- package/out/policy/registry.js.map +1 -0
- package/out/resources/LocaleIndex.d.ts +54 -0
- package/out/resources/LocaleIndex.d.ts.map +1 -0
- package/out/resources/LocaleIndex.js +91 -0
- package/out/resources/LocaleIndex.js.map +1 -0
- package/out/resources/ResourceMapCache.d.ts +40 -0
- package/out/resources/ResourceMapCache.d.ts.map +1 -0
- package/out/resources/ResourceMapCache.js +75 -0
- package/out/resources/ResourceMapCache.js.map +1 -0
- package/out/resources/collections.d.ts +28 -0
- package/out/resources/collections.d.ts.map +1 -0
- package/out/resources/collections.js +76 -0
- package/out/resources/collections.js.map +1 -0
- package/out/resources/db/index.d.ts +57 -0
- package/out/resources/db/index.d.ts.map +1 -0
- package/out/resources/db/index.js +57 -0
- package/out/resources/db/index.js.map +1 -0
- package/out/resources/debugging.d.ts +16 -0
- package/out/resources/debugging.d.ts.map +1 -0
- package/out/resources/debugging.js +12 -0
- package/out/resources/debugging.js.map +1 -0
- package/out/resources/fs.d.ts +12 -0
- package/out/resources/fs.d.ts.map +1 -0
- package/out/resources/fs.js +13 -0
- package/out/resources/fs.js.map +1 -0
- package/out/resources/git.d.ts +24 -0
- package/out/resources/git.d.ts.map +1 -0
- package/out/resources/git.js +36 -0
- package/out/resources/git.js.map +1 -0
- package/out/resources/index.d.ts +19 -0
- package/out/resources/index.d.ts.map +1 -0
- package/out/resources/index.js +19 -0
- package/out/resources/index.js.map +1 -0
- package/out/resources/languages/index.d.ts +24 -0
- package/out/resources/languages/index.d.ts.map +1 -0
- package/out/resources/languages/index.js +43 -0
- package/out/resources/languages/index.js.map +1 -0
- package/out/resources/languages/types.gen.d.ts +259 -0
- package/out/resources/languages/types.gen.d.ts.map +1 -0
- package/out/resources/languages/types.gen.js +983 -0
- package/out/resources/languages/types.gen.js.map +1 -0
- package/out/resources/libaddressinput.d.ts +103 -0
- package/out/resources/libaddressinput.d.ts.map +1 -0
- package/out/resources/libaddressinput.js +30 -0
- package/out/resources/libaddressinput.js.map +1 -0
- package/out/resources/libpostal.d.ts +31 -0
- package/out/resources/libpostal.d.ts.map +1 -0
- package/out/resources/libpostal.js +117 -0
- package/out/resources/libpostal.js.map +1 -0
- package/out/resources/locale.d.ts +14 -0
- package/out/resources/locale.d.ts.map +1 -0
- package/out/resources/locale.js +22 -0
- package/out/resources/locale.js.map +1 -0
- package/out/resources/set.d.ts +62 -0
- package/out/resources/set.d.ts.map +1 -0
- package/out/resources/set.js +149 -0
- package/out/resources/set.js.map +1 -0
- package/out/resources/whosonfirst/DataSourceCache.d.ts +18 -0
- package/out/resources/whosonfirst/DataSourceCache.d.ts.map +1 -0
- package/out/resources/whosonfirst/DataSourceCache.js +53 -0
- package/out/resources/whosonfirst/DataSourceCache.js.map +1 -0
- package/out/resources/whosonfirst/PlacetypeDataSource.d.ts +74 -0
- package/out/resources/whosonfirst/PlacetypeDataSource.d.ts.map +1 -0
- package/out/resources/whosonfirst/PlacetypeDataSource.js +111 -0
- package/out/resources/whosonfirst/PlacetypeDataSource.js.map +1 -0
- package/out/resources/whosonfirst/index.d.ts +10 -0
- package/out/resources/whosonfirst/index.d.ts.map +1 -0
- package/out/resources/whosonfirst/index.js +10 -0
- package/out/resources/whosonfirst/index.js.map +1 -0
- package/out/resources/whosonfirst/loader.d.ts +56 -0
- package/out/resources/whosonfirst/loader.d.ts.map +1 -0
- package/out/resources/whosonfirst/loader.js +115 -0
- package/out/resources/whosonfirst/loader.js.map +1 -0
- package/out/resources/whosonfirst/placetypes/Placetype.d.ts +128 -0
- package/out/resources/whosonfirst/placetypes/Placetype.d.ts.map +1 -0
- package/out/resources/whosonfirst/placetypes/Placetype.js +338 -0
- package/out/resources/whosonfirst/placetypes/Placetype.js.map +1 -0
- package/out/resources/whosonfirst/placetypes/admin.d.ts +48 -0
- package/out/resources/whosonfirst/placetypes/admin.d.ts.map +1 -0
- package/out/resources/whosonfirst/placetypes/admin.js +61 -0
- package/out/resources/whosonfirst/placetypes/admin.js.map +1 -0
- package/out/resources/whosonfirst/placetypes/definition.d.ts +73 -0
- package/out/resources/whosonfirst/placetypes/definition.d.ts.map +1 -0
- package/out/resources/whosonfirst/placetypes/definition.js +26 -0
- package/out/resources/whosonfirst/placetypes/definition.js.map +1 -0
- package/out/resources/whosonfirst/placetypes/index.d.ts +10 -0
- package/out/resources/whosonfirst/placetypes/index.d.ts.map +1 -0
- package/out/resources/whosonfirst/placetypes/index.js +10 -0
- package/out/resources/whosonfirst/placetypes/index.js.map +1 -0
- package/out/resources/whosonfirst/placetypes/mermaid.d.ts +20 -0
- package/out/resources/whosonfirst/placetypes/mermaid.d.ts.map +1 -0
- package/out/resources/whosonfirst/placetypes/mermaid.js +44 -0
- package/out/resources/whosonfirst/placetypes/mermaid.js.map +1 -0
- package/out/solver/BaseSolver.d.ts +24 -0
- package/out/solver/BaseSolver.d.ts.map +1 -0
- package/out/solver/BaseSolver.js +7 -0
- package/out/solver/BaseSolver.js.map +1 -0
- package/out/solver/HashMapSolver.d.ts +15 -0
- package/out/solver/HashMapSolver.d.ts.map +1 -0
- package/out/solver/HashMapSolver.js +61 -0
- package/out/solver/HashMapSolver.js.map +1 -0
- package/out/solver/Solution.d.ts +69 -0
- package/out/solver/Solution.d.ts.map +1 -0
- package/out/solver/Solution.js +137 -0
- package/out/solver/Solution.js.map +1 -0
- package/out/solver/SolutionMatch.d.ts +69 -0
- package/out/solver/SolutionMatch.d.ts.map +1 -0
- package/out/solver/SolutionMatch.js +101 -0
- package/out/solver/SolutionMatch.js.map +1 -0
- package/out/solver/index.d.ts +11 -0
- package/out/solver/index.d.ts.map +1 -0
- package/out/solver/index.js +11 -0
- package/out/solver/index.js.map +1 -0
- package/out/solver/mask.d.ts +27 -0
- package/out/solver/mask.d.ts.map +1 -0
- package/out/solver/mask.js +52 -0
- package/out/solver/mask.js.map +1 -0
- package/out/solvers/ExclusiveCartesianSolver.d.ts +12 -0
- package/out/solvers/ExclusiveCartesianSolver.d.ts.map +1 -0
- package/out/solvers/ExclusiveCartesianSolver.js +58 -0
- package/out/solvers/ExclusiveCartesianSolver.js.map +1 -0
- package/out/solvers/HouseNumberPositionPenalty.d.ts +10 -0
- package/out/solvers/HouseNumberPositionPenalty.d.ts.map +1 -0
- package/out/solvers/HouseNumberPositionPenalty.js +63 -0
- package/out/solvers/HouseNumberPositionPenalty.js.map +1 -0
- package/out/solvers/LeadingAreaDeclassifier.d.ts +13 -0
- package/out/solvers/LeadingAreaDeclassifier.d.ts.map +1 -0
- package/out/solvers/LeadingAreaDeclassifier.js +35 -0
- package/out/solvers/LeadingAreaDeclassifier.js.map +1 -0
- package/out/solvers/MultiStreetSolver.d.ts +32 -0
- package/out/solvers/MultiStreetSolver.d.ts.map +1 -0
- package/out/solvers/MultiStreetSolver.js +110 -0
- package/out/solvers/MultiStreetSolver.js.map +1 -0
- package/out/solvers/OrphanedLevelTypeDeclassifier.d.ts +10 -0
- package/out/solvers/OrphanedLevelTypeDeclassifier.d.ts.map +1 -0
- package/out/solvers/OrphanedLevelTypeDeclassifier.js +21 -0
- package/out/solvers/OrphanedLevelTypeDeclassifier.js.map +1 -0
- package/out/solvers/OrphanedUnitTypeDeclassifier.d.ts +10 -0
- package/out/solvers/OrphanedUnitTypeDeclassifier.d.ts.map +1 -0
- package/out/solvers/OrphanedUnitTypeDeclassifier.js +21 -0
- package/out/solvers/OrphanedUnitTypeDeclassifier.js.map +1 -0
- package/out/solvers/PostcodePositionPenalty.d.ts +16 -0
- package/out/solvers/PostcodePositionPenalty.d.ts.map +1 -0
- package/out/solvers/PostcodePositionPenalty.js +33 -0
- package/out/solvers/PostcodePositionPenalty.js.map +1 -0
- package/out/solvers/VenueCaptureSolver.d.ts +13 -0
- package/out/solvers/VenueCaptureSolver.d.ts.map +1 -0
- package/out/solvers/VenueCaptureSolver.js +22 -0
- package/out/solvers/VenueCaptureSolver.js.map +1 -0
- package/out/solvers/index.d.ts +14 -0
- package/out/solvers/index.d.ts.map +1 -0
- package/out/solvers/index.js +14 -0
- package/out/solvers/index.js.map +1 -0
- package/out/tokenization/Graph.d.ts +35 -0
- package/out/tokenization/Graph.d.ts.map +1 -0
- package/out/tokenization/Graph.js +38 -0
- package/out/tokenization/Graph.js.map +1 -0
- package/out/tokenization/Span.d.ts +115 -0
- package/out/tokenization/Span.d.ts.map +1 -0
- package/out/tokenization/Span.js +223 -0
- package/out/tokenization/Span.js.map +1 -0
- package/out/tokenization/context.d.ts +39 -0
- package/out/tokenization/context.d.ts.map +1 -0
- package/out/tokenization/context.js +114 -0
- package/out/tokenization/context.js.map +1 -0
- package/out/tokenization/index.d.ts +11 -0
- package/out/tokenization/index.d.ts.map +1 -0
- package/out/tokenization/index.js +11 -0
- package/out/tokenization/index.js.map +1 -0
- package/out/tokenization/normalizer.d.ts +41 -0
- package/out/tokenization/normalizer.d.ts.map +1 -0
- package/out/tokenization/normalizer.js +94 -0
- package/out/tokenization/normalizer.js.map +1 -0
- package/out/tokenization/permutate.d.ts +29 -0
- package/out/tokenization/permutate.d.ts.map +1 -0
- package/out/tokenization/permutate.js +73 -0
- package/out/tokenization/permutate.js.map +1 -0
- package/out/tokenization/split.d.ts +22 -0
- package/out/tokenization/split.d.ts.map +1 -0
- package/out/tokenization/split.js +63 -0
- package/out/tokenization/split.js.map +1 -0
- package/out/types/classifier.d.ts +117 -0
- package/out/types/classifier.d.ts.map +1 -0
- package/out/types/classifier.js +19 -0
- package/out/types/classifier.js.map +1 -0
- package/out/types/component.d.ts +42 -0
- package/out/types/component.d.ts.map +1 -0
- package/out/types/component.js +69 -0
- package/out/types/component.js.map +1 -0
- package/out/types/index.d.ts +9 -0
- package/out/types/index.d.ts.map +1 -0
- package/out/types/index.js +9 -0
- package/out/types/index.js.map +1 -0
- package/out/types/mapping.d.ts +38 -0
- package/out/types/mapping.d.ts.map +1 -0
- package/out/types/mapping.js +71 -0
- package/out/types/mapping.js.map +1 -0
- package/out/utils/index.d.ts +7 -0
- package/out/utils/index.d.ts.map +1 -0
- package/out/utils/index.js +7 -0
- package/out/utils/index.js.map +1 -0
- package/out/utils/repo.d.ts +42 -0
- package/out/utils/repo.d.ts.map +1 -0
- package/out/utils/repo.js +72 -0
- package/out/utils/repo.js.map +1 -0
- package/out/vitest.config.d.ts +15 -0
- package/out/vitest.config.d.ts.map +1 -0
- package/out/vitest.config.js +45 -0
- package/out/vitest.config.js.map +1 -0
- package/package.json +45 -0
|
@@ -0,0 +1,14 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* @copyright Sister Software
|
|
3
|
+
* @license AGPL-3.0
|
|
4
|
+
* @author Teffen Ellis, et al.
|
|
5
|
+
*/
|
|
6
|
+
export * from "./ExclusiveCartesianSolver.js";
|
|
7
|
+
export * from "./HouseNumberPositionPenalty.js";
|
|
8
|
+
export * from "./LeadingAreaDeclassifier.js";
|
|
9
|
+
export * from "./MultiStreetSolver.js";
|
|
10
|
+
export * from "./OrphanedLevelTypeDeclassifier.js";
|
|
11
|
+
export * from "./OrphanedUnitTypeDeclassifier.js";
|
|
12
|
+
export * from "./PostcodePositionPenalty.js";
|
|
13
|
+
export * from "./VenueCaptureSolver.js";
|
|
14
|
+
//# sourceMappingURL=index.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../solvers/index.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAEH,cAAc,+BAA+B,CAAA;AAC7C,cAAc,iCAAiC,CAAA;AAC/C,cAAc,8BAA8B,CAAA;AAC5C,cAAc,wBAAwB,CAAA;AACtC,cAAc,oCAAoC,CAAA;AAClD,cAAc,mCAAmC,CAAA;AACjD,cAAc,8BAA8B,CAAA;AAC5C,cAAc,yBAAyB,CAAA"}
|
|
@@ -0,0 +1,14 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* @copyright Sister Software
|
|
3
|
+
* @license AGPL-3.0
|
|
4
|
+
* @author Teffen Ellis, et al.
|
|
5
|
+
*/
|
|
6
|
+
export * from "./ExclusiveCartesianSolver.js";
|
|
7
|
+
export * from "./HouseNumberPositionPenalty.js";
|
|
8
|
+
export * from "./LeadingAreaDeclassifier.js";
|
|
9
|
+
export * from "./MultiStreetSolver.js";
|
|
10
|
+
export * from "./OrphanedLevelTypeDeclassifier.js";
|
|
11
|
+
export * from "./OrphanedUnitTypeDeclassifier.js";
|
|
12
|
+
export * from "./PostcodePositionPenalty.js";
|
|
13
|
+
export * from "./VenueCaptureSolver.js";
|
|
14
|
+
//# sourceMappingURL=index.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"index.js","sourceRoot":"","sources":["../../solvers/index.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAEH,cAAc,+BAA+B,CAAA;AAC7C,cAAc,iCAAiC,CAAA;AAC/C,cAAc,8BAA8B,CAAA;AAC5C,cAAc,wBAAwB,CAAA;AACtC,cAAc,oCAAoC,CAAA;AAClD,cAAc,mCAAmC,CAAA;AACjD,cAAc,8BAA8B,CAAA;AAC5C,cAAc,yBAAyB,CAAA"}
|
|
@@ -0,0 +1,35 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* @copyright Sister Software
|
|
3
|
+
* @license AGPL-3.0
|
|
4
|
+
* @author Teffen Ellis, et al.
|
|
5
|
+
*/
|
|
6
|
+
import { Sequence } from "@mailwoman/core/resources";
|
|
7
|
+
export type GraphNodeCallback<G> = (node: G) => boolean;
|
|
8
|
+
/**
|
|
9
|
+
* A graph structure for storing relationships between nodes.
|
|
10
|
+
*/
|
|
11
|
+
export declare class Graph<GraphNode extends WeakKey> {
|
|
12
|
+
/**
|
|
13
|
+
* Parents of the graph, i.e. upward connections to the graph.
|
|
14
|
+
*/
|
|
15
|
+
parents: Sequence<GraphNode>;
|
|
16
|
+
/**
|
|
17
|
+
* Children of the graph, i.e. downward connections to the graph.
|
|
18
|
+
*/
|
|
19
|
+
children: Sequence<GraphNode>;
|
|
20
|
+
/**
|
|
21
|
+
* Previous siblings of the graph, i.e. leftward connections to the graph.
|
|
22
|
+
*/
|
|
23
|
+
readonly previousSiblings: Sequence<GraphNode>;
|
|
24
|
+
/**
|
|
25
|
+
* Next siblings of the graph, i.e. rightward connections to the graph.
|
|
26
|
+
*/
|
|
27
|
+
readonly nextSiblings: Sequence<GraphNode>;
|
|
28
|
+
/**
|
|
29
|
+
* Phrases identified in the graph, i.e. a sequence of nodes composing a classification.
|
|
30
|
+
*/
|
|
31
|
+
readonly phrases: Sequence<GraphNode>;
|
|
32
|
+
get nextSibling(): GraphNode | null;
|
|
33
|
+
get previousSibling(): GraphNode | null;
|
|
34
|
+
}
|
|
35
|
+
//# sourceMappingURL=Graph.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"Graph.d.ts","sourceRoot":"","sources":["../../tokenization/Graph.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAEH,OAAO,EAAE,QAAQ,EAAE,MAAM,2BAA2B,CAAA;AAEpD,MAAM,MAAM,iBAAiB,CAAC,CAAC,IAAI,CAAC,IAAI,EAAE,CAAC,KAAK,OAAO,CAAA;AAEvD;;GAEG;AACH,qBAAa,KAAK,CAAC,SAAS,SAAS,OAAO;IAC3C;;OAEG;IACI,OAAO,EAAE,QAAQ,CAAC,SAAS,CAAC,CAAiB;IAEpD;;OAEG;IACI,QAAQ,EAAE,QAAQ,CAAC,SAAS,CAAC,CAAiB;IAErD;;OAEG;IACH,SAAgB,gBAAgB,sBAA4B;IAC5D;;OAEG;IACH,SAAgB,YAAY,sBAA4B;IAExD;;OAEG;IACH,SAAgB,OAAO,EAAE,QAAQ,CAAC,SAAS,CAAC,CAA4B;IAExE,IAAW,WAAW,IAAI,SAAS,GAAG,IAAI,CAEzC;IAED,IAAW,eAAe,IAAI,SAAS,GAAG,IAAI,CAE7C;CACD"}
|
|
@@ -0,0 +1,38 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* @copyright Sister Software
|
|
3
|
+
* @license AGPL-3.0
|
|
4
|
+
* @author Teffen Ellis, et al.
|
|
5
|
+
*/
|
|
6
|
+
import { Sequence } from "@mailwoman/core/resources";
|
|
7
|
+
/**
|
|
8
|
+
* A graph structure for storing relationships between nodes.
|
|
9
|
+
*/
|
|
10
|
+
export class Graph {
|
|
11
|
+
/**
|
|
12
|
+
* Parents of the graph, i.e. upward connections to the graph.
|
|
13
|
+
*/
|
|
14
|
+
parents = new Sequence();
|
|
15
|
+
/**
|
|
16
|
+
* Children of the graph, i.e. downward connections to the graph.
|
|
17
|
+
*/
|
|
18
|
+
children = new Sequence();
|
|
19
|
+
/**
|
|
20
|
+
* Previous siblings of the graph, i.e. leftward connections to the graph.
|
|
21
|
+
*/
|
|
22
|
+
previousSiblings = new Sequence();
|
|
23
|
+
/**
|
|
24
|
+
* Next siblings of the graph, i.e. rightward connections to the graph.
|
|
25
|
+
*/
|
|
26
|
+
nextSiblings = new Sequence();
|
|
27
|
+
/**
|
|
28
|
+
* Phrases identified in the graph, i.e. a sequence of nodes composing a classification.
|
|
29
|
+
*/
|
|
30
|
+
phrases = new Sequence();
|
|
31
|
+
get nextSibling() {
|
|
32
|
+
return this.nextSiblings.first;
|
|
33
|
+
}
|
|
34
|
+
get previousSibling() {
|
|
35
|
+
return this.previousSiblings.first;
|
|
36
|
+
}
|
|
37
|
+
}
|
|
38
|
+
//# sourceMappingURL=Graph.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"Graph.js","sourceRoot":"","sources":["../../tokenization/Graph.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAEH,OAAO,EAAE,QAAQ,EAAE,MAAM,2BAA2B,CAAA;AAIpD;;GAEG;AACH,MAAM,OAAO,KAAK;IACjB;;OAEG;IACI,OAAO,GAAwB,IAAI,QAAQ,EAAE,CAAA;IAEpD;;OAEG;IACI,QAAQ,GAAwB,IAAI,QAAQ,EAAE,CAAA;IAErD;;OAEG;IACa,gBAAgB,GAAG,IAAI,QAAQ,EAAa,CAAA;IAC5D;;OAEG;IACa,YAAY,GAAG,IAAI,QAAQ,EAAa,CAAA;IAExD;;OAEG;IACa,OAAO,GAAwB,IAAI,QAAQ,EAAa,CAAA;IAExE,IAAW,WAAW;QACrB,OAAO,IAAI,CAAC,YAAY,CAAC,KAAK,CAAA;IAC/B,CAAC;IAED,IAAW,eAAe;QACzB,OAAO,IAAI,CAAC,gBAAgB,CAAC,KAAK,CAAA;IACnC,CAAC;CACD"}
|
|
@@ -0,0 +1,115 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* @copyright Sister Software
|
|
3
|
+
* @license AGPL-3.0
|
|
4
|
+
* @author Teffen Ellis, et al.
|
|
5
|
+
*/
|
|
6
|
+
import { type Classification, type ClassificationMatch, ClassificationsMatchMap } from "../classification/Classification.js";
|
|
7
|
+
import type { Displayable } from "../resources/debugging.js";
|
|
8
|
+
import type { Alpha3bLanguageCode } from "../resources/languages/index.js";
|
|
9
|
+
import type { LibPostalLanguageCode } from "../resources/libpostal.js";
|
|
10
|
+
import { Graph } from "./Graph.js";
|
|
11
|
+
export interface SpanCreationOptions {
|
|
12
|
+
start?: number;
|
|
13
|
+
classifications?: Iterable<Classification>;
|
|
14
|
+
children?: Iterable<Span>;
|
|
15
|
+
}
|
|
16
|
+
declare const kSpanID: unique symbol;
|
|
17
|
+
export interface SerializedSpan {
|
|
18
|
+
body: string;
|
|
19
|
+
start: number;
|
|
20
|
+
end: number;
|
|
21
|
+
normalized: string;
|
|
22
|
+
classifications: ClassificationMatch[];
|
|
23
|
+
children: SerializedSpan[];
|
|
24
|
+
phrases: SerializedSpan[];
|
|
25
|
+
}
|
|
26
|
+
/**
|
|
27
|
+
* A span of text, i.e. a token or a phrase.
|
|
28
|
+
*/
|
|
29
|
+
export declare class Span extends Graph<Span> {
|
|
30
|
+
#private;
|
|
31
|
+
/**
|
|
32
|
+
* The start index of the span.
|
|
33
|
+
*/
|
|
34
|
+
start: number;
|
|
35
|
+
/**
|
|
36
|
+
* The end index of the span.
|
|
37
|
+
*/
|
|
38
|
+
end: number;
|
|
39
|
+
/**
|
|
40
|
+
* Counter used to assign identifiers to spans; incremented once per constructed span.
|
|
41
|
+
*/
|
|
42
|
+
protected static IDCounter: number;
|
|
43
|
+
/**
|
|
44
|
+
* The unique identifier for this span.
|
|
45
|
+
*/
|
|
46
|
+
readonly [kSpanID]: number;
|
|
47
|
+
get id(): number;
|
|
48
|
+
/**
|
|
49
|
+
* The normalized body of the span.
|
|
50
|
+
*/
|
|
51
|
+
normalized: string;
|
|
52
|
+
/**
|
|
53
|
+
* Classifications for this span.
|
|
54
|
+
*/
|
|
55
|
+
readonly classifications: ClassificationsMatchMap;
|
|
56
|
+
/**
|
|
57
|
+
* Boolean-like indications that hint at the nature of the span.
|
|
58
|
+
*
|
|
59
|
+
* Unlike classifications, these are not exposed in the final output.
|
|
60
|
+
*/
|
|
61
|
+
get flags(): ReadonlySet<SpanFlag>;
|
|
62
|
+
is(classification: Classification): boolean;
|
|
63
|
+
static from(input?: string, options?: SpanCreationOptions): Span;
|
|
64
|
+
static from(input: Span, options?: Omit<SpanCreationOptions, "start">): Span;
|
|
65
|
+
static from(input: Span | string, options?: SpanCreationOptions): Span;
|
|
66
|
+
constructor(body?: string, start?: number);
|
|
67
|
+
get body(): string;
|
|
68
|
+
/**
|
|
69
|
+
* Set the body of the Span
|
|
70
|
+
*/
|
|
71
|
+
set body(nextBody: string);
|
|
72
|
+
/**
|
|
73
|
+
* Predicate to determine if this Span intersects another Span
|
|
74
|
+
*/
|
|
75
|
+
intersects(that: Pick<Span, "start" | "end">): boolean;
|
|
76
|
+
/**
|
|
77
|
+
* Predicate to determine if this Span covers another Span
|
|
78
|
+
*/
|
|
79
|
+
covers(that: Pick<Span, "start" | "end">): boolean;
|
|
80
|
+
/**
|
|
81
|
+
* Returns the distance between two Spans
|
|
82
|
+
*
|
|
83
|
+
* @todo Use graph to find prev and next spans for a more accurate result
|
|
84
|
+
*
|
|
85
|
+
* @todo Or base 'distance' on word distance (slop) rather than characters
|
|
86
|
+
*/
|
|
87
|
+
distance(that: Pick<Span, "start" | "end">): number;
|
|
88
|
+
/**
|
|
89
|
+
* Returns the coverage of the span, i.e. the number of characters covered by the span and its
|
|
90
|
+
* children.
|
|
91
|
+
*/
|
|
92
|
+
get coverage(): number;
|
|
93
|
+
/**
|
|
94
|
+
* The combined languages of the span's children.
|
|
95
|
+
*/
|
|
96
|
+
get languages(): Displayable<ReadonlySet<LibPostalLanguageCode | Alpha3bLanguageCode>>;
|
|
97
|
+
/**
|
|
98
|
+
* Serialize the span to JSON.
|
|
99
|
+
*/
|
|
100
|
+
toJSON(): SerializedSpan;
|
|
101
|
+
toString(): string;
|
|
102
|
+
/**
|
|
103
|
+
* Connect siblings in the graph.
|
|
104
|
+
*/
|
|
105
|
+
static connectSiblings(...spans: Span[]): Span[];
|
|
106
|
+
}
|
|
107
|
+
export type SpanFlag = "ends_with_period" | "numeric" | "alpha" | "alphanumeric" | "numeral" | "punctuation";
|
|
108
|
+
/**
|
|
109
|
+
* Patterns to test and apply classifications to spans.
|
|
110
|
+
*
|
|
111
|
+
* Note that order here is important, as the first pattern that matches will be used.
|
|
112
|
+
*/
|
|
113
|
+
export declare const PatternMatchers: readonly [pattern: RegExp, flag: SpanFlag][];
|
|
114
|
+
export {};
|
|
115
|
+
//# sourceMappingURL=Span.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"Span.d.ts","sourceRoot":"","sources":["../../tokenization/Span.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAMH,OAAO,EACN,KAAK,cAAc,EACnB,KAAK,mBAAmB,EACxB,uBAAuB,EACvB,MAAM,qCAAqC,CAAA;AAC5C,OAAO,KAAK,EAAE,WAAW,EAAE,MAAM,2BAA2B,CAAA;AAC5D,OAAO,KAAK,EAAE,mBAAmB,EAAE,MAAM,iCAAiC,CAAA;AAC1E,OAAO,KAAK,EAAE,qBAAqB,EAAE,MAAM,2BAA2B,CAAA;AACtE,OAAO,EAAE,KAAK,EAAE,MAAM,YAAY,CAAA;AAIlC,MAAM,WAAW,mBAAmB;IACnC,KAAK,CAAC,EAAE,MAAM,CAAA;IACd,eAAe,CAAC,EAAE,QAAQ,CAAC,cAAc,CAAC,CAAA;IAC1C,QAAQ,CAAC,EAAE,QAAQ,CAAC,IAAI,CAAC,CAAA;CACzB;AAED,QAAA,MAAM,OAAO,EAAE,OAAO,MAAyB,CAAA;AAE/C,MAAM,WAAW,cAAc;IAE9B,IAAI,EAAE,MAAM,CAAA;IACZ,KAAK,EAAE,MAAM,CAAA;IACb,GAAG,EAAE,MAAM,CAAA;IACX,UAAU,EAAE,MAAM,CAAA;IAClB,eAAe,EAAE,mBAAmB,EAAE,CAAA;IACtC,QAAQ,EAAE,cAAc,EAAE,CAAA;IAC1B,OAAO,EAAE,cAAc,EAAE,CAAA;CACzB;AAED;;GAEG;AACH,qBAAa,IAAK,SAAQ,KAAK,CAAC,IAAI,CAAC;;IAEpC;;OAEG;IACI,KAAK,EAAE,MAAM,CAAA;IAEpB;;OAEG;IACI,GAAG,EAAG,MAAM,CAAA;IAEnB;;OAEG;IACH,SAAS,CAAC,MAAM,CAAC,SAAS,SAAI;IAE9B;;OAEG;IACH,QAAQ,CAAC,CAAC,OAAO,CAAC,EAAG,MAAM,CAAA;IAE3B,IAAW,EAAE,IAAI,MAAM,CAEtB;IAED;;OAEG;IACI,UAAU,SAAK;IAEtB;;OAEG;IACH,SAAgB,eAAe,EAAE,uBAAuB,CAAgC;IAIxF;;;;OAIG;IACH,IAAW,KAAK,IAAI,WAAW,CAAC,QAAQ,CAAC,CAExC;IAEM,EAAE,CAAC,cAAc,EAAE,cAAc,GAAG,OAAO;IAIlD,MAAM,CAAC,IAAI,CAAC,KAAK,CAAC,EAAE,MAAM,EAAE,OAAO,CAAC,EAAE,mBAAmB,GAAG,IAAI;IAChE,MAAM,CAAC,IAAI,CAAC,KAAK,EAAE,IAAI,EAAE,OAAO,CAAC,EAAE,IAAI,CAAC,mBAAmB,EAAE,OAAO,CAAC,GAAG,IAAI;IAC5E,MAAM,CAAC,IAAI,CAAC,KAAK,EAAE,IAAI,GAAG,MAAM,EAAE,OAAO,CAAC,EAAE,mBAAmB,GAAG,IAAI;gBAa1D,IAAI,SAAK,EAAE,KAAK,SAAI;IAgBhC,IAAI,IAAI,IAAI,MAAM,CAEjB;IAED;;OAEG;IACH,IAAI,IAAI,CAAC,QAAQ,EAAE,MAAM,EAsBxB;IAED;;OAEG;IACI,UAAU,CAAC,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,OAAO,GAAG,KAAK,CAAC,GAAG,OAAO;IAI7D;;OAEG;IACI,MAAM,CAAC,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,OAAO,GAAG,KAAK,CAAC,GAAG,OAAO;IAIzD;;;;;;OAMG;IACI,QAAQ,CAAC,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,OAAO,GAAG,KAAK,CAAC,GAAG,MAAM;IAS1D;;;OAGG;IACH,IAAW,QAAQ,IAAI,MAAM,CAU5B;IAED;;OAEG;IACH,IAAW,SAAS,IAAI,WAAW,CAAC,WAAW,CAAC,qBAAqB
,GAAG,mBAAmB,CAAC,CAAC,CAwB5F;IAED;;OAEG;IACI,MAAM,IAAI,cAAc;IAiBf,QAAQ;IAWxB;;OAEG;IACH,MAAM,CAAC,eAAe,CAAC,GAAG,KAAK,EAAE,IAAI,EAAE;CAavC;AAED,MAAM,MAAM,QAAQ,GAAG,kBAAkB,GAAG,SAAS,GAAG,OAAO,GAAG,cAAc,GAAG,SAAS,GAAG,aAAa,CAAA;AAE5G;;;;GAIG;AACH,eAAO,MAAM,eAAe,EAAE,SAAS,CAAC,OAAO,EAAE,MAAM,EAAE,IAAI,EAAE,QAAQ,CAAC,EAYvE,CAAA"}
|
|
@@ -0,0 +1,223 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* @copyright Sister Software
|
|
3
|
+
* @license AGPL-3.0
|
|
4
|
+
* @author Teffen Ellis, et al.
|
|
5
|
+
*/
|
|
6
|
+
// Imported via deep relative path (not @mailwoman/core/classification) to avoid a runtime cycle:
|
|
7
|
+
// classification/index.ts re-exports SectionClassifier / WordClassifier which themselves import
|
|
8
|
+
// Span from @mailwoman/core/tokenization, creating a TDZ that surfaces as "Class extends value
|
|
9
|
+
// undefined" when the source-mode test runner loads tokenization first.
|
|
10
|
+
import { ClassificationsMatchMap, } from "../classification/Classification.js";
|
|
11
|
+
import { Graph } from "./Graph.js";
|
|
12
|
+
const MAX_SPAN_LENGTH = 140;
|
|
13
|
+
const kSpanID = Symbol("SpanID");
|
|
14
|
+
/**
 * A span of text, i.e. a token or a phrase.
 *
 * A span tracks the character range it occupies (`start` inclusive, `end` computed as
 * `start + body.length`), its raw and lowercased body, the classifications attached to it, and a
 * small set of lexical flags derived from the body.
 */
export class Span extends Graph {
	#body = "";
	/**
	 * The start index of the span.
	 */
	start;
	/**
	 * The end index of the span. Recomputed from `start` every time `body` is assigned.
	 */
	end;
	/**
	 * Counter used to assign identifiers; incremented once per constructed span.
	 */
	static IDCounter = 0;
	/**
	 * The unique identifier for this span.
	 */
	[kSpanID];
	get id() {
		return this[kSpanID];
	}
	/**
	 * The normalized (lowercased) body of the span.
	 */
	normalized = "";
	/**
	 * Classifications for this span.
	 */
	classifications = new ClassificationsMatchMap();
	#flags = new Set();
	/**
	 * Boolean-like indications that hint at the nature of the span.
	 *
	 * Unlike classifications, these are not exposed in the final output.
	 */
	get flags() {
		return this.#flags;
	}
	/**
	 * Predicate to determine if the given classification is attached to this span.
	 */
	is(classification) {
		return this.classifications.has(classification);
	}
	/**
	 * Create a span from a string, or decorate an existing span.
	 *
	 * When `input` is already a Span it is returned as-is (so `options.start` is ignored); the
	 * given classifications and children are added to it in either case.
	 */
	static from(input = "", options = {}) {
		const span = input instanceof Span ? input : new Span(input, options.start);
		for (const classification of options.classifications ?? []) {
			span.classifications.add(classification);
		}
		span.children.add(...(options.children ?? []));
		return span;
	}
	constructor(body = "", start = 0) {
		super();
		// Defined through a descriptor rather than plain assignment so that the identifier is
		// read-only, non-enumerable and cannot be reconfigured.
		Object.defineProperty(this, kSpanID, {
			value: Span.IDCounter++,
			writable: false,
			enumerable: false,
			configurable: false,
		});
		// Note that `start` should be set first to ensure that `end` is calculated correctly.
		this.start = start;
		this.body = body;
	}
	get body() {
		return this.#body;
	}
	/**
	 * Set the body of the Span.
	 *
	 * The body is truncated to `MAX_SPAN_LENGTH` characters, after which `normalized`, `end` and
	 * the flags are all recomputed from the truncated value.
	 */
	set body(nextBody) {
		this.#flags.clear();
		this.#body = nextBody.slice(0, MAX_SPAN_LENGTH);
		this.normalized = this.#body.toLowerCase();
		this.end = this.start + this.#body.length;
		// Only the first matching pattern contributes a flag.
		for (const [pattern, flag] of PatternMatchers) {
			if (pattern.test(this.normalized)) {
				this.#flags.add(flag);
				break;
			}
		}
		if (this.#flags.has("numeric") || this.#flags.has("alphanumeric")) {
			this.#flags.add("numeral");
		}
		if (this.#body.slice(-1) === ".") {
			this.#flags.add("ends_with_period");
		}
	}
	/**
	 * Predicate to determine if this Span intersects another Span.
	 *
	 * Spans that merely touch (one ends exactly where the other starts) do not intersect.
	 */
	intersects(that) {
		return this.start < that.end && this.end > that.start;
	}
	/**
	 * Predicate to determine if this Span covers another Span.
	 */
	covers(that) {
		return this.start <= that.start && this.end >= that.end;
	}
	/**
	 * Returns the distance, in characters, between two Spans. Never negative; intersecting or
	 * touching spans are at distance 0.
	 *
	 * @todo Use graph to find prev and next spans for a more accurate result
	 *
	 * @todo Or base 'distance' on word distance (slop) rather than characters
	 */
	distance(that) {
		if (this.intersects(that)) {
			return 0;
		}
		// `<=` rather than `<`: when this span ends exactly where `that` starts, `intersects` is
		// false, and a strict comparison would fall through to `this.start - that.end`, which is
		// negative for a span lying before `that`.
		if (this.end <= that.start) {
			return that.start - this.end;
		}
		return this.start - that.end;
	}
	/**
	 * Returns the coverage of the span: the summed lengths of its children when it has any,
	 * otherwise its own length.
	 */
	get coverage() {
		if (this.children.size) {
			return Iterator.from(this.children).reduce((sum, child) => sum + (child.end - child.start), 0);
		}
		return this.end - this.start;
	}
	/**
	 * The combined languages of the span's children.
	 *
	 * The returned set also carries a `displayName` property: the distinct display names found on
	 * the children's classification languages joined with ", ", or `undefined` when there are none.
	 */
	get languages() {
		// Spread children langs to the parent...
		const languages = new Set();
		const displayNames = new Set();
		for (const child of this.children) {
			for (const classification of child.classifications.values()) {
				const childLanguages = classification.languages;
				if (!childLanguages) {
					continue;
				}
				if (childLanguages.displayName) {
					displayNames.add(childLanguages.displayName);
				}
				for (const language of childLanguages) {
					languages.add(language);
				}
			}
		}
		languages.displayName = displayNames.size ? Array.from(displayNames).join(", ") : undefined;
		return languages;
	}
	/**
	 * Serialize the span to JSON. Children and phrases are serialized recursively; the span id is
	 * not part of the serialized form.
	 */
	toJSON() {
		return {
			body: this.body,
			start: this.start,
			end: this.end,
			normalized: this.normalized,
			classifications: this.classifications.toJSON(),
			children: Iterator.from(this.children)
				.map((c) => c.toJSON())
				.toArray(),
			phrases: Iterator.from(this.phrases)
				.map((p) => p.toJSON())
				.toArray(),
		};
	}
	/**
	 * Human-readable summary: child count, body, classification keys and flags.
	 */
	toString() {
		const classifications = Array.from(this.classifications.keys()).join(", ");
		const flags = Array.from(this.#flags).join(", ");
		return `Span(${this.children.size}) "${this.body}" [${classifications}][${flags}]`;
	}
	// Registered under Node's well-known inspect symbol so that inspecting a span prints the summary.
	[Symbol.for("nodejs.util.inspect.custom")]() {
		return this.toString();
	}
	/**
	 * Connect siblings in the graph: each span gets its immediate left neighbour added to
	 * `previousSiblings` and its immediate right neighbour added to `nextSiblings`.
	 *
	 * @returns The same array of spans that was passed in.
	 */
	static connectSiblings(...spans) {
		for (const [i, span] of spans.entries()) {
			if (spans[i - 1]) {
				span.previousSiblings.add(spans[i - 1]);
			}
			if (spans[i + 1]) {
				span.nextSiblings.add(spans[i + 1]);
			}
		}
		return spans;
	}
}
|
|
208
|
+
/**
 * Ordered `[pattern, flag]` pairs used to derive a lexical flag from a span's text.
 *
 * The order of the entries is significant: the list is meant to be scanned from the top and the
 * first pattern that matches decides the flag.
 */
export const PatternMatchers = [
	[
		// One or more digits and nothing else.
		/^\d+$/,
		"numeric",
	],
	[
		// Made up solely of the listed punctuation and symbol characters.
		/^[@&/\\#,+()$~%.!^'";:*?[\]<>{}]+$/,
		"punctuation",
	],
	[
		// ASCII letters, plus anything `\W` admits (every character other than ASCII letters,
		// digits and underscore). In effect: no digits and no underscores.
		/^[A-Za-z\W]+$/,
		"alpha",
	],
	[
		// As above but digits are allowed as well. In effect: no underscores.
		/^[A-Za-z0-9\W]+$/,
		"alphanumeric",
	],
];
|
|
223
|
+
//# sourceMappingURL=Span.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"Span.js","sourceRoot":"","sources":["../../tokenization/Span.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAEH,iGAAiG;AACjG,gGAAgG;AAChG,+FAA+F;AAC/F,wEAAwE;AACxE,OAAO,EAGN,uBAAuB,GACvB,MAAM,qCAAqC,CAAA;AAI5C,OAAO,EAAE,KAAK,EAAE,MAAM,YAAY,CAAA;AAElC,MAAM,eAAe,GAAG,GAAG,CAAA;AAQ3B,MAAM,OAAO,GAAkB,MAAM,CAAC,QAAQ,CAAC,CAAA;AAa/C;;GAEG;AACH,MAAM,OAAO,IAAK,SAAQ,KAAW;IACpC,KAAK,GAAW,EAAE,CAAA;IAClB;;OAEG;IACI,KAAK,CAAQ;IAEpB;;OAEG;IACI,GAAG,CAAS;IAEnB;;OAEG;IACO,MAAM,CAAC,SAAS,GAAG,CAAC,CAAA;IAE9B;;OAEG;IACM,CAAC,OAAO,CAAC,CAAS;IAE3B,IAAW,EAAE;QACZ,OAAO,IAAI,CAAC,OAAO,CAAC,CAAA;IACrB,CAAC;IAED;;OAEG;IACI,UAAU,GAAG,EAAE,CAAA;IAEtB;;OAEG;IACa,eAAe,GAA4B,IAAI,uBAAuB,EAAE,CAAA;IAE/E,MAAM,GAAG,IAAI,GAAG,EAAY,CAAA;IAErC;;;;OAIG;IACH,IAAW,KAAK;QACf,OAAO,IAAI,CAAC,MAAM,CAAA;IACnB,CAAC;IAEM,EAAE,CAAC,cAA8B;QACvC,OAAO,IAAI,CAAC,eAAe,CAAC,GAAG,CAAC,cAAc,CAAC,CAAA;IAChD,CAAC;IAKD,MAAM,CAAC,IAAI,CAAC,QAAuB,EAAE,EAAE,UAA+B,EAAE;QACvE,MAAM,IAAI,GAAG,KAAK,YAAY,IAAI,CAAC,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,IAAI,IAAI,CAAC,KAAK,EAAE,OAAO,CAAC,KAAK,CAAC,CAAA;QAE3E,KAAK,MAAM,cAAc,IAAI,OAAO,CAAC,eAAe,IAAI,EAAE,EAAE,CAAC;YAC5D,IAAI,CAAC,eAAe,CAAC,GAAG,CAAC,cAAc,CAAC,CAAA;QACzC,CAAC;QAED,IAAI,CAAC,QAAQ,CAAC,GAAG,CAAC,GAAG,CAAC,OAAO,CAAC,QAAQ,IAAI,EAAE,CAAC,CAAC,CAAA;QAE9C,OAAO,IAAI,CAAA;IACZ,CAAC;IAED,YAAY,IAAI,GAAG,EAAE,EAAE,KAAK,GAAG,CAAC;QAC/B,KAAK,EAAE,CAAA;QAEP,mCAAmC;QACnC,MAAM,CAAC,cAAc,CAAC,IAAI,EAAE,OAAO,EAAE;YACpC,KAAK,EAAE,IAAI,CAAC,SAAS,EAAE;YACvB,QAAQ,EAAE,KAAK;YACf,UAAU,EAAE,KAAK;YACjB,YAAY,EAAE,KAAK;SACnB,CAAC,CAAA;QAEF,sFAAsF;QACtF,IAAI,CAAC,KAAK,GAAG,KAAK,CAAA;QAClB,IAAI,CAAC,IAAI,GAAG,IAAI,CAAA;IACjB,CAAC;IAED,IAAI,IAAI;QACP,OAAO,IAAI,CAAC,KAAK,CAAA;IAClB,CAAC;IAED;;OAEG;IACH,IAAI,IAAI,CAAC,QAAgB;QACxB,IAAI,CAAC,MAAM,CAAC,KAAK,EAAE,CAAA;QACnB,IAAI,CAAC,KAAK,GAAG,QAAQ,CAAC,KAAK,CAAC,CAAC,EAAE,eAAe,CAAC,CAAA;QAE/C,IAAI,CAAC,UAAU,GAAG,IAAI,CAAC,KAAK,CAAC,WAAW,EAAE,CAAA;QAC1C,IAAI,CAAC,GAAG,GAAG,IAAI,CAAC,KAAK,GAAG,IAAI,CAAC,KAAK,CAAC,MAAM,CAAA;QAEzC,KAAK,MAAM,CAAC,OAAO,
EAAE,IAAI,CAAC,IAAI,eAAe,EAAE,CAAC;YAC/C,IAAI,OAAO,CAAC,IAAI,CAAC,IAAI,CAAC,UAAU,CAAC,EAAE,CAAC;gBACnC,IAAI,CAAC,MAAM,CAAC,GAAG,CAAC,IAAI,CAAC,CAAA;gBAErB,MAAK;YACN,CAAC;QACF,CAAC;QAED,IAAI,IAAI,CAAC,KAAK,CAAC,GAAG,CAAC,SAAS,CAAC,IAAI,IAAI,CAAC,KAAK,CAAC,GAAG,CAAC,cAAc,CAAC,EAAE,CAAC;YACjE,IAAI,CAAC,MAAM,CAAC,GAAG,CAAC,SAAS,CAAC,CAAA;QAC3B,CAAC;QAED,IAAI,IAAI,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC,KAAK,GAAG,EAAE,CAAC;YAClC,IAAI,CAAC,MAAM,CAAC,GAAG,CAAC,kBAAkB,CAAC,CAAA;QACpC,CAAC;IACF,CAAC;IAED;;OAEG;IACI,UAAU,CAAC,IAAiC;QAClD,OAAO,IAAI,CAAC,KAAK,GAAG,IAAI,CAAC,GAAG,IAAI,IAAI,CAAC,GAAG,GAAG,IAAI,CAAC,KAAK,CAAA;IACtD,CAAC;IAED;;OAEG;IACI,MAAM,CAAC,IAAiC;QAC9C,OAAO,IAAI,CAAC,KAAK,IAAI,IAAI,CAAC,KAAK,IAAI,IAAI,CAAC,GAAG,IAAI,IAAI,CAAC,GAAG,CAAA;IACxD,CAAC;IAED;;;;;;OAMG;IACI,QAAQ,CAAC,IAAiC;QAChD,IAAI,IAAI,CAAC,UAAU,CAAC,IAAI,CAAC;YAAE,OAAO,CAAC,CAAA;QAEnC,IAAI,IAAI,CAAC,GAAG,GAAG,IAAI,CAAC,KAAK,EAAE,CAAC;YAC3B,OAAO,IAAI,CAAC,KAAK,GAAG,IAAI,CAAC,GAAG,CAAA;QAC7B,CAAC;QACD,OAAO,IAAI,CAAC,KAAK,GAAG,IAAI,CAAC,GAAG,CAAA;IAC7B,CAAC;IAED;;;OAGG;IACH,IAAW,QAAQ;QAClB,IAAI,IAAI,CAAC,QAAQ,CAAC,IAAI,EAAE,CAAC;YACxB,OAAO,CACN,QAAQ;gBACP,MAAM;iBACL,IAAI,CAAC,IAAI,CAAC,QAAQ,CAAC;iBACnB,MAAM,CAAC,CAAC,GAAG,EAAE,KAAK,EAAE,EAAE,CAAC,GAAG,GAAG,CAAC,KAAK,CAAC,GAAG,GAAG,KAAK,CAAC,KAAK,CAAC,EAAE,CAAC,CAAC,CAC5D,CAAA;QACF,CAAC;QACD,OAAO,IAAI,CAAC,GAAG,GAAG,IAAI,CAAC,KAAK,CAAA;IAC7B,CAAC;IAED;;OAEG;IACH,IAAW,SAAS;QACnB,yCAAyC;QACzC,MAAM,SAAS,GAAkE,IAAI,GAAG,EAAE,CAAA;QAC1F,MAAM,YAAY,GAAG,IAAI,GAAG,EAAU,CAAA;QAEtC,KAAK,MAAM,KAAK,IAAI,IAAI,CAAC,QAAQ,EAAE,CAAC;YACnC,KAAK,MAAM,cAAc,IAAI,KAAK,CAAC,eAAe,CAAC,MAAM,EAAE,EAAE,CAAC;gBAC7D,MAAM,cAAc,GAAG,cAAc,CAAC,SAAS,CAAA;gBAE/C,IAAI,CAAC,cAAc;oBAAE,SAAQ;gBAE7B,IAAI,cAAc,CAAC,WAAW,EAAE,CAAC;oBAChC,YAAY,CAAC,GAAG,CAAC,cAAc,CAAC,WAAW,CAAC,CAAA;gBAC7C,CAAC;gBAED,KAAK,MAAM,QAAQ,IAAI,cAAc,EAAE,CAAC;oBACvC,SAAS,CAAC,GAAG,CAAC,QAAQ,CAAC,CAAA;gBACxB,CAAC;YACF,CAAC;QACF,CAAC;QAED,SAAS,CAAC,WAAW,GAAG,YAAY,CAAC,IAAI,CAAC,CAAC,CAAC,KAAK,CAAC,IAAI,CAAC,YAAY,CAAC,
CAAC,IAAI,CAAC,IAAI,CAAC,CAAC,CAAC,CAAC,SAAS,CAAA;QAE3F,OAAO,SAAS,CAAA;IACjB,CAAC;IAED;;OAEG;IACI,MAAM;QACZ,OAAO;YACN,sBAAsB;YACtB,IAAI,EAAE,IAAI,CAAC,IAAI;YACf,KAAK,EAAE,IAAI,CAAC,KAAK;YACjB,GAAG,EAAE,IAAI,CAAC,GAAG;YACb,UAAU,EAAE,IAAI,CAAC,UAAU;YAC3B,eAAe,EAAE,IAAI,CAAC,eAAe,CAAC,MAAM,EAAE;YAC9C,QAAQ,EAAE,QAAQ,CAAC,IAAI,CAAC,IAAI,CAAC,QAAQ,CAAC;iBACpC,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,MAAM,EAAE,CAAC;iBACtB,OAAO,EAAE;YACX,OAAO,EAAE,QAAQ,CAAC,IAAI,CAAC,IAAI,CAAC,OAAO,CAAC;iBAClC,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,MAAM,EAAE,CAAC;iBACtB,OAAO,EAAE;SACc,CAAA;IAC3B,CAAC;IAEe,QAAQ;QACvB,MAAM,eAAe,GAAG,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,eAAe,CAAC,IAAI,EAAE,CAAC,CAAC,IAAI,CAAC,IAAI,CAAC,CAAA;QAC1E,MAAM,KAAK,GAAG,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC,IAAI,CAAC,IAAI,CAAC,CAAA;QAEhD,OAAO,QAAQ,IAAI,CAAC,QAAQ,CAAC,IAAI,MAAM,IAAI,CAAC,IAAI,MAAM,eAAe,KAAK,KAAK,GAAG,CAAA;IACnF,CAAC;IAEM,CAAC,MAAM,CAAC,GAAG,CAAC,4BAA4B,CAAC,CAAC;QAChD,OAAO,IAAI,CAAC,QAAQ,EAAE,CAAA;IACvB,CAAC;IAED;;OAEG;IACH,MAAM,CAAC,eAAe,CAAC,GAAG,KAAa;QACtC,KAAK,MAAM,CAAC,CAAC,EAAE,IAAI,CAAC,IAAI,KAAK,CAAC,OAAO,EAAE,EAAE,CAAC;YACzC,IAAI,KAAK,CAAC,CAAC,GAAG,CAAC,CAAC,EAAE,CAAC;gBAClB,IAAI,CAAC,gBAAgB,CAAC,GAAG,CAAC,KAAK,CAAC,CAAC,GAAG,CAAC,CAAE,CAAC,CAAA;YACzC,CAAC;YAED,IAAI,KAAK,CAAC,CAAC,GAAG,CAAC,CAAC,EAAE,CAAC;gBAClB,IAAI,CAAC,YAAY,CAAC,GAAG,CAAC,KAAK,CAAC,CAAC,GAAG,CAAC,CAAE,CAAC,CAAA;YACrC,CAAC;QACF,CAAC;QAED,OAAO,KAAK,CAAA;IACb,CAAC;;AAKF;;;;GAIG;AACH,MAAM,CAAC,MAAM,eAAe,GAAiD;IAC5E,+CAA+C;IAC/C,CAAC,OAAO,EAAE,SAAS,CAAC;IAEpB,8GAA8G;IAC9G,CAAC,oCAAoC,EAAE,aAAa,CAAC;IAErD,8CAA8C;IAC9C,CAAC,eAAe,EAAE,OAAO,CAAC;IAE1B,gEAAgE;IAChE,CAAC,kBAAkB,EAAE,cAAc,CAAC;CACpC,CAAA"}
|
|
@@ -0,0 +1,39 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* @copyright Sister Software
|
|
3
|
+
* @license AGPL-3.0
|
|
4
|
+
* @author Teffen Ellis, et al.
|
|
5
|
+
*/
|
|
6
|
+
import { type SerializedSolution, type Solution } from "@mailwoman/core/solver";
|
|
7
|
+
import { type SerializedSpan, Span } from "./Span.js";
|
|
8
|
+
export interface SerializedTokenContext {
|
|
9
|
+
span: SerializedSpan;
|
|
10
|
+
solutions: SerializedSolution[];
|
|
11
|
+
sections: SerializedSpan[];
|
|
12
|
+
readonly coverage: number;
|
|
13
|
+
}
|
|
14
|
+
/**
|
|
15
|
+
* Tokenizes a string into sections and phrases.
|
|
16
|
+
*/
|
|
17
|
+
export declare class TokenContext {
|
|
18
|
+
#private;
|
|
19
|
+
get solutions(): Solution[];
|
|
20
|
+
set solutions(nextSolutions: Solution[]);
|
|
21
|
+
get span(): Span;
|
|
22
|
+
/**
|
|
23
|
+
* Sections of the tokenization.
|
|
24
|
+
*/
|
|
25
|
+
get sections(): Span[];
|
|
26
|
+
constructor(input?: string);
|
|
27
|
+
/**
|
|
28
|
+
* Evaluate and rank the solutions.
|
|
29
|
+
*
|
|
30
|
+
* This method is called after the solver has generated solutions, modifying the solutions
|
|
31
|
+
* in-place.
|
|
32
|
+
*/
|
|
33
|
+
evaluateAndRank(solutionLimit: number): void;
|
|
34
|
+
/**
|
|
35
|
+
* Serialize the tokenizer.
|
|
36
|
+
*/
|
|
37
|
+
toJSON(): SerializedTokenContext;
|
|
38
|
+
}
|
|
39
|
+
//# sourceMappingURL=context.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"context.d.ts","sourceRoot":"","sources":["../../tokenization/context.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAEH,OAAO,EAGN,KAAK,kBAAkB,EACvB,KAAK,QAAQ,EACb,MAAM,wBAAwB,CAAA;AAE/B,OAAO,EAAE,KAAK,cAAc,EAAE,IAAI,EAAE,MAAM,WAAW,CAAA;AAGrD,MAAM,WAAW,sBAAsB;IACtC,IAAI,EAAE,cAAc,CAAA;IACpB,SAAS,EAAE,kBAAkB,EAAE,CAAA;IAC/B,QAAQ,EAAE,cAAc,EAAE,CAAA;IAC1B,QAAQ,CAAC,QAAQ,EAAE,MAAM,CAAA;CACzB;AAED;;GAEG;AACH,qBAAa,YAAY;;IAOxB,IAAW,SAAS,IAAI,QAAQ,EAAE,CAEjC;IAED,IAAW,SAAS,CAAC,aAAa,EAAE,QAAQ,EAAE,EAW7C;IAED,IAAW,IAAI,IAAI,IAAI,CAEtB;IAED;;OAEG;IACH,IAAW,QAAQ,IAAI,IAAI,EAAE,CAE5B;gBAEW,KAAK,GAAE,MAAW;IAuB9B;;;;;OAKG;IACI,eAAe,CAAC,aAAa,EAAE,MAAM,GAAG,IAAI;IAkBnD;;OAEG;IACI,MAAM,IAAI,sBAAsB;CAQvC"}
|
|
@@ -0,0 +1,114 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* @copyright Sister Software
|
|
3
|
+
* @license AGPL-3.0
|
|
4
|
+
* @author Teffen Ellis, et al.
|
|
5
|
+
*/
|
|
6
|
+
import { compareMatchesByStart, rankingSolutionsByAreaClassification, } from "@mailwoman/core/solver";
|
|
7
|
+
import { permutate } from "./permutate.js";
|
|
8
|
+
import { Span } from "./Span.js";
|
|
9
|
+
import { fieldsFuncBoundary, fieldsFuncHyphenOrWhiteSpace, fieldsFuncWhiteSpace, splitByField } from "./split.js";
|
|
10
|
+
/**
 * Holds the tokenization of one input string: the root span, its sections, the phrases generated
 * for each section, and the solutions later attached by the solver.
 */
export class TokenContext {
	#span;
	#sections = [];
	#coverage = 0;
	#solutions = [];
	/**
	 * Solutions currently attached to this context.
	 */
	get solutions() {
		return this.#solutions;
	}
	set solutions(nextSolutions) {
		this.#solutions = nextSolutions;
	}
	/**
	 * The root span built from the input.
	 */
	get span() {
		return this.#span;
	}
	/**
	 * Sections of the tokenization.
	 */
	get sections() {
		return this.#sections;
	}
	constructor(input = "") {
		this.#span = Span.from(input);
		// First pass: cut the root span into sections on boundaries.
		const boundarySections = splitByField(this.#span, fieldsFuncBoundary);
		// Second pass: populate every section's children, whitespace split first and the
		// hyphen-or-whitespace split second.
		const childSplitters = [fieldsFuncWhiteSpace, fieldsFuncHyphenOrWhiteSpace];
		for (const section of boundarySections) {
			for (const splitter of childSplitters) {
				section.children.add(...splitByField(section, splitter));
			}
		}
		this.#sections = boundarySections;
		this.#coverage = computeCoverage(boundarySections);
		// Last pass: derive the phrases of each section from permutations of its children.
		for (const section of this.#sections) {
			section.phrases.add(...permutate(section.children, { from: 0, to: 10 }));
		}
	}
	/**
	 * Evaluate and rank the solutions.
	 *
	 * Meant to run once the solver has produced its solutions. Each solution is re-scored against
	 * this context's coverage and has its matches sorted in place; the solution list is then sorted
	 * in place and cut down to at most `solutionLimit` entries.
	 */
	evaluateAndRank(solutionLimit) {
		const candidates = this.#solutions;
		if (candidates.length === 0) {
			return;
		}
		for (const candidate of candidates) {
			candidate.computeScore(this.#coverage);
			candidate.matches.sort(compareMatchesByStart);
		}
		// `sort` reorders `candidates` in place and returns it; only the leading slice is kept.
		this.#solutions = candidates.sort(rankingSolutionsByAreaClassification).slice(0, solutionLimit);
	}
	/**
	 * Serialize the context: root span, sections, solutions and coverage.
	 */
	toJSON() {
		const span = this.span.toJSON();
		const sections = this.sections.map((section) => section.toJSON());
		const solutions = this.#solutions.map((solution) => solution.toJSON());
		return { span, sections, solutions, coverage: this.#coverage };
	}
}
|
|
89
|
+
/**
 * Walk a chain of spans through `nextSibling`, adding each span's length (`end - start`) to `sum`.
 *
 * @param sum Running total to start from.
 * @param currentSpan First span of the chain; a falsy value yields `sum` unchanged.
 * @returns The accumulated total.
 * @throws {Error} When a span's `end` is smaller than its `start`.
 */
function computeCoverageRec(sum, currentSpan) {
	let total = sum;
	for (let span = currentSpan; span; span = span.nextSibling) {
		total += span.end - span.start;
		if (span.end < span.start) {
			throw new Error(`Tokenizer: invalid span ${span.start} ${span.end}`);
		}
	}
	return total;
}
|
|
101
|
+
/**
 * Sum the coverage of every section, where a section's coverage is measured by walking the
 * sibling chain that starts at its first child.
 *
 * @param sections Sections whose `children.first` heads the chain to measure.
 * @returns The combined coverage of all sections.
 * @throws {Error} When a section has no first child.
 */
function computeCoverage(sections) {
	let total = 0;
	let index = 0;
	for (const section of sections) {
		const head = section.children.first;
		if (!head) {
			throw new Error(`Tokenizer: section ${index} has no children`);
		}
		total += computeCoverageRec(0, head);
		index += 1;
	}
	return total;
}
|
|
114
|
+
//# sourceMappingURL=context.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"context.js","sourceRoot":"","sources":["../../tokenization/context.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAEH,OAAO,EACN,qBAAqB,EACrB,oCAAoC,GAGpC,MAAM,wBAAwB,CAAA;AAC/B,OAAO,EAAE,SAAS,EAAE,MAAM,gBAAgB,CAAA;AAC1C,OAAO,EAAuB,IAAI,EAAE,MAAM,WAAW,CAAA;AACrD,OAAO,EAAE,kBAAkB,EAAE,4BAA4B,EAAE,oBAAoB,EAAE,YAAY,EAAE,MAAM,YAAY,CAAA;AASjH;;GAEG;AACH,MAAM,OAAO,YAAY;IACxB,KAAK,CAAO;IACZ,SAAS,GAAW,EAAE,CAAA;IACtB,SAAS,GAAW,CAAC,CAAA;IAErB,UAAU,GAAe,EAAE,CAAA;IAE3B,IAAW,SAAS;QACnB,OAAO,IAAI,CAAC,UAAU,CAAA;IACvB,CAAC;IAED,IAAW,SAAS,CAAC,aAAyB;QAC7C,iFAAiF;QACjF,yDAAyD;QACzD,wDAAwD;QAExD,4DAA4D;QAC5D,wDAAwD;QACxD,KAAK;QACL,IAAI;QAEJ,IAAI,CAAC,UAAU,GAAG,aAAa,CAAA;IAChC,CAAC;IAED,IAAW,IAAI;QACd,OAAO,IAAI,CAAC,KAAK,CAAA;IAClB,CAAC;IAED;;OAEG;IACH,IAAW,QAAQ;QAClB,OAAO,IAAI,CAAC,SAAS,CAAA;IACtB,CAAC;IAED,YAAY,QAAgB,EAAE;QAC7B,IAAI,CAAC,KAAK,GAAG,IAAI,CAAC,IAAI,CAAC,KAAK,CAAC,CAAA;QAE7B,iCAAiC;QACjC,MAAM,QAAQ,GAAG,YAAY,CAAC,IAAI,CAAC,KAAK,EAAE,kBAAkB,CAAC,CAAA;QAE7D,KAAK,MAAM,OAAO,IAAI,QAAQ,EAAE,CAAC;YAChC,yCAAyC;YACzC,OAAO,CAAC,QAAQ,CAAC,GAAG,CAAC,GAAG,YAAY,CAAC,OAAO,EAAE,oBAAoB,CAAC,CAAC,CAAA;YACpE,OAAO,CAAC,QAAQ,CAAC,GAAG,CAAC,GAAG,YAAY,CAAC,OAAO,EAAE,4BAA4B,CAAC,CAAC,CAAA;QAC7E,CAAC;QAED,IAAI,CAAC,SAAS,GAAG,QAAQ,CAAA;QACzB,IAAI,CAAC,SAAS,GAAG,eAAe,CAAC,QAAQ,CAAC,CAAA;QAE1C,uCAAuC;QACvC,KAAK,MAAM,OAAO,IAAI,IAAI,CAAC,QAAQ,EAAE,CAAC;YACrC,MAAM,YAAY,GAAG,SAAS,CAAC,OAAO,CAAC,QAAQ,EAAE,EAAE,IAAI,EAAE,CAAC,EAAE,EAAE,EAAE,EAAE,EAAE,CAAC,CAAA;YAErE,OAAO,CAAC,OAAO,CAAC,GAAG,CAAC,GAAG,YAAY,CAAC,CAAA;QACrC,CAAC;IACF,CAAC;IAED;;;;;OAKG;IACI,eAAe,CAAC,aAAqB;QAC3C,IAAI,IAAI,CAAC,UAAU,CAAC,MAAM,KAAK,CAAC;YAAE,OAAM;QAExC,KAAK,MAAM,QAAQ,IAAI,IAAI,CAAC,UAAU,EAAE,CAAC;YACxC,qBAAqB;YACrB,QAAQ,CAAC,YAAY,CAAC,IAAI,CAAC,SAAS,CAAC,CAAA;YAErC,mBAAmB;YACnB,QAAQ,CAAC,OAAO,CAAC,IAAI,CAAC,qBAAqB,CAAC,CAAA;QAC7C,CAAC;QAED,yBAAyB;QACzB,IAAI,CAAC,UAAU,CAAC,IAAI,CAAC,oCAAoC,CAAC,CAAA;QAE1D,4CAA4C;QAC5C,IAAI,CAAC,UAAU,GAAG,IAAI,CAAC,UAAU,CAAC,KAAK,CAAC,CAAC,EAAE,aAAa,CAAC,CAAA;IAC1D,CAAC;IAED;;
OAEG;IACI,MAAM;QACZ,OAAO;YACN,IAAI,EAAE,IAAI,CAAC,IAAI,CAAC,MAAM,EAAE;YACxB,QAAQ,EAAE,IAAI,CAAC,QAAQ,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,MAAM,EAAE,CAAC;YAC9C,SAAS,EAAE,IAAI,CAAC,UAAU,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,MAAM,EAAE,CAAC;YACjD,QAAQ,EAAE,IAAI,CAAC,SAAS;SACxB,CAAA;IACF,CAAC;CACD;AAED;;GAEG;AACH,SAAS,kBAAkB,CAAC,GAAW,EAAE,WAAwB;IAChE,IAAI,CAAC,WAAW;QAAE,OAAO,GAAG,CAAA;IAE5B,GAAG,IAAI,WAAW,CAAC,GAAG,GAAG,WAAW,CAAC,KAAK,CAAA;IAE1C,IAAI,WAAW,CAAC,GAAG,GAAG,WAAW,CAAC,KAAK,EAAE,CAAC;QACzC,MAAM,IAAI,KAAK,CAAC,2BAA2B,WAAW,CAAC,KAAK,IAAI,WAAW,CAAC,GAAG,EAAE,CAAC,CAAA;IACnF,CAAC;IAED,OAAO,kBAAkB,CAAC,GAAG,EAAE,WAAW,CAAC,WAAW,CAAC,CAAA;AACxD,CAAC;AAED;;GAEG;AACH,SAAS,eAAe,CAAC,QAAgB;IACxC,IAAI,QAAQ,GAAG,CAAC,CAAA;IAEhB,KAAK,MAAM,CAAC,CAAC,EAAE,OAAO,CAAC,IAAI,QAAQ,CAAC,OAAO,EAAE,EAAE,CAAC;QAC/C,MAAM,UAAU,GAAG,OAAO,CAAC,QAAQ,CAAC,KAAK,CAAA;QAEzC,IAAI,CAAC,UAAU;YAAE,MAAM,IAAI,KAAK,CAAC,sBAAsB,CAAC,kBAAkB,CAAC,CAAA;QAE3E,QAAQ,IAAI,kBAAkB,CAAC,CAAC,EAAE,UAAU,CAAC,CAAA;IAC9C,CAAC;IAED,OAAO,QAAQ,CAAA;AAChB,CAAC"}
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* @copyright Sister Software
|
|
3
|
+
* @license AGPL-3.0
|
|
4
|
+
* @author Teffen Ellis, et al.
|
|
5
|
+
*/
|
|
6
|
+
export * from "./context.js";
|
|
7
|
+
export * from "./Graph.js";
|
|
8
|
+
export * from "./normalizer.js";
|
|
9
|
+
export * from "./permutate.js";
|
|
10
|
+
export * from "./Span.js";
|
|
11
|
+
//# sourceMappingURL=index.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../tokenization/index.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAEH,cAAc,cAAc,CAAA;AAC5B,cAAc,YAAY,CAAA;AAC1B,cAAc,iBAAiB,CAAA;AAC/B,cAAc,gBAAgB,CAAA;AAC9B,cAAc,WAAW,CAAA"}
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* @copyright Sister Software
|
|
3
|
+
* @license AGPL-3.0
|
|
4
|
+
* @author Teffen Ellis, et al.
|
|
5
|
+
*/
|
|
6
|
+
export * from "./context.js";
|
|
7
|
+
export * from "./Graph.js";
|
|
8
|
+
export * from "./normalizer.js";
|
|
9
|
+
export * from "./permutate.js";
|
|
10
|
+
export * from "./Span.js";
|
|
11
|
+
//# sourceMappingURL=index.js.map
|