pubid 1.15.19 → 2.0.0.pre.alpha.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (601) hide show
  1. checksums.yaml +4 -4
  2. data/LICENSE.txt +1 -1
  3. data/README.adoc +2041 -53
  4. data/archived-gems/pubid-ccsds/update_codes.yaml +1 -0
  5. data/archived-gems/pubid-iec/stages.yaml +129 -0
  6. data/archived-gems/pubid-iec/update_codes.yaml +67 -0
  7. data/archived-gems/pubid-ieee/update_codes.yaml +104 -0
  8. data/archived-gems/pubid-iso/stages.yaml +106 -0
  9. data/archived-gems/pubid-iso/update_codes.yaml +4 -0
  10. data/archived-gems/pubid-itu/i18n.yaml +13 -0
  11. data/archived-gems/pubid-itu/series.yaml +42 -0
  12. data/archived-gems/pubid-nist/publishers.yaml +6 -0
  13. data/archived-gems/pubid-nist/series.yaml +121 -0
  14. data/archived-gems/pubid-nist/stages.yaml +16 -0
  15. data/archived-gems/pubid-nist/update_codes.yaml +93 -0
  16. data/archived-gems/pubid-plateau/update_codes.yaml +6 -0
  17. data/data/ccsds/update_codes.yaml +1 -0
  18. data/data/iec/update_codes.yaml +67 -0
  19. data/data/ieee/update_codes.yaml +104 -0
  20. data/data/iso/update_codes.yaml +21 -0
  21. data/data/nist/update_codes.yaml +87 -0
  22. data/data/plateau/update_codes.yaml +6 -0
  23. data/lib/pubid/amca/builder.rb +176 -0
  24. data/lib/pubid/amca/identifier.rb +18 -0
  25. data/lib/pubid/amca/identifiers/base.rb +64 -0
  26. data/lib/pubid/amca/identifiers/interpretation.rb +51 -0
  27. data/lib/pubid/amca/identifiers/publication.rb +47 -0
  28. data/lib/pubid/amca/identifiers/standard.rb +22 -0
  29. data/lib/pubid/amca/identifiers.rb +12 -0
  30. data/lib/pubid/amca/parser.rb +153 -0
  31. data/lib/pubid/amca/scheme.rb +16 -0
  32. data/lib/pubid/amca/single_identifier.rb +33 -0
  33. data/lib/pubid/amca/urn_generator.rb +50 -0
  34. data/lib/pubid/amca.rb +26 -0
  35. data/lib/pubid/ansi/builder.rb +52 -0
  36. data/lib/pubid/ansi/identifier.rb +13 -0
  37. data/lib/pubid/ansi/identifiers/american_national_standard.rb +12 -0
  38. data/lib/pubid/ansi/identifiers/standard.rb +16 -0
  39. data/lib/pubid/ansi/identifiers.rb +11 -0
  40. data/lib/pubid/ansi/parser.rb +91 -0
  41. data/lib/pubid/ansi/scheme.rb +15 -0
  42. data/lib/pubid/ansi/single_identifier.rb +45 -0
  43. data/lib/pubid/ansi/urn_generator.rb +76 -0
  44. data/lib/pubid/ansi.rb +27 -0
  45. data/lib/pubid/api/builder.rb +85 -0
  46. data/lib/pubid/api/components/code.rb +9 -0
  47. data/lib/pubid/api/identifier.rb +21 -0
  48. data/lib/pubid/api/identifiers/base.rb +24 -0
  49. data/lib/pubid/api/identifiers/bulletin.rb +15 -0
  50. data/lib/pubid/api/identifiers/continuous_operations_standard.rb +15 -0
  51. data/lib/pubid/api/identifiers/mpms.rb +44 -0
  52. data/lib/pubid/api/identifiers/publication.rb +15 -0
  53. data/lib/pubid/api/identifiers/recommended_practice.rb +15 -0
  54. data/lib/pubid/api/identifiers/specification.rb +15 -0
  55. data/lib/pubid/api/identifiers/standard.rb +15 -0
  56. data/lib/pubid/api/identifiers/technical_report.rb +15 -0
  57. data/lib/pubid/api/identifiers/typeless_standard.rb +27 -0
  58. data/lib/pubid/api/parser.rb +140 -0
  59. data/lib/pubid/api/scheme.rb +66 -0
  60. data/lib/pubid/api/single_identifier.rb +46 -0
  61. data/lib/pubid/api/urn_generator.rb +41 -0
  62. data/lib/pubid/api.rb +17 -0
  63. data/lib/pubid/ashrae/builder.rb +498 -0
  64. data/lib/pubid/ashrae/identifier.rb +18 -0
  65. data/lib/pubid/ashrae/identifiers/addenda_package.rb +46 -0
  66. data/lib/pubid/ashrae/identifiers/addendum.rb +55 -0
  67. data/lib/pubid/ashrae/identifiers/base.rb +23 -0
  68. data/lib/pubid/ashrae/identifiers/combined_addenda.rb +51 -0
  69. data/lib/pubid/ashrae/identifiers/errata.rb +40 -0
  70. data/lib/pubid/ashrae/identifiers/guideline.rb +38 -0
  71. data/lib/pubid/ashrae/identifiers/interpretation.rb +39 -0
  72. data/lib/pubid/ashrae/identifiers/standard.rb +38 -0
  73. data/lib/pubid/ashrae/identifiers.rb +16 -0
  74. data/lib/pubid/ashrae/parser.rb +724 -0
  75. data/lib/pubid/ashrae/scheme.rb +53 -0
  76. data/lib/pubid/ashrae/single_identifier.rb +23 -0
  77. data/lib/pubid/ashrae/supplement_identifier.rb +23 -0
  78. data/lib/pubid/ashrae/urn_generator.rb +59 -0
  79. data/lib/pubid/ashrae.rb +21 -0
  80. data/lib/pubid/asme/builder.rb +153 -0
  81. data/lib/pubid/asme/components/code.rb +18 -0
  82. data/lib/pubid/asme/identifier.rb +15 -0
  83. data/lib/pubid/asme/identifiers/base.rb +70 -0
  84. data/lib/pubid/asme/identifiers/standard.rb +12 -0
  85. data/lib/pubid/asme/identifiers.rb +10 -0
  86. data/lib/pubid/asme/parser.rb +308 -0
  87. data/lib/pubid/asme/scheme.rb +37 -0
  88. data/lib/pubid/asme/single_identifier.rb +29 -0
  89. data/lib/pubid/asme/urn_generator.rb +133 -0
  90. data/lib/pubid/asme.rb +21 -0
  91. data/lib/pubid/astm/builder.rb +159 -0
  92. data/lib/pubid/astm/components/code.rb +33 -0
  93. data/lib/pubid/astm/identifier.rb +15 -0
  94. data/lib/pubid/astm/identifiers/adjunct.rb +21 -0
  95. data/lib/pubid/astm/identifiers/base.rb +13 -0
  96. data/lib/pubid/astm/identifiers/data_series.rb +25 -0
  97. data/lib/pubid/astm/identifiers/iso_dual_published.rb +74 -0
  98. data/lib/pubid/astm/identifiers/manual.rb +40 -0
  99. data/lib/pubid/astm/identifiers/monograph.rb +25 -0
  100. data/lib/pubid/astm/identifiers/research_report.rb +18 -0
  101. data/lib/pubid/astm/identifiers/standard.rb +52 -0
  102. data/lib/pubid/astm/identifiers/technical_report.rb +23 -0
  103. data/lib/pubid/astm/identifiers/work_in_progress.rb +21 -0
  104. data/lib/pubid/astm/parser.rb +244 -0
  105. data/lib/pubid/astm/scheme.rb +55 -0
  106. data/lib/pubid/astm/single_identifier.rb +25 -0
  107. data/lib/pubid/astm/urn_generator.rb +99 -0
  108. data/lib/pubid/astm.rb +38 -0
  109. data/lib/pubid/bsi/builder.rb +1483 -0
  110. data/lib/pubid/bsi/components/code.rb +11 -0
  111. data/lib/pubid/bsi/components/date.rb +11 -0
  112. data/lib/pubid/bsi/components/publisher.rb +11 -0
  113. data/lib/pubid/bsi/components/type.rb +11 -0
  114. data/lib/pubid/bsi/identifier.rb +27 -0
  115. data/lib/pubid/bsi/identifiers/addendum_document.rb +64 -0
  116. data/lib/pubid/bsi/identifiers/adopted_european_norm.rb +95 -0
  117. data/lib/pubid/bsi/identifiers/adopted_international_standard.rb +82 -0
  118. data/lib/pubid/bsi/identifiers/aerospace_standard.rb +118 -0
  119. data/lib/pubid/bsi/identifiers/amendment.rb +40 -0
  120. data/lib/pubid/bsi/identifiers/base.rb +11 -0
  121. data/lib/pubid/bsi/identifiers/british_industrial_practice.rb +27 -0
  122. data/lib/pubid/bsi/identifiers/british_standard.rb +33 -0
  123. data/lib/pubid/bsi/identifiers/bundled_identifier.rb +114 -0
  124. data/lib/pubid/bsi/identifiers/committee_document.rb +51 -0
  125. data/lib/pubid/bsi/identifiers/consolidated_identifier.rb +152 -0
  126. data/lib/pubid/bsi/identifiers/corrigendum.rb +28 -0
  127. data/lib/pubid/bsi/identifiers/detailed_specification.rb +69 -0
  128. data/lib/pubid/bsi/identifiers/disc.rb +56 -0
  129. data/lib/pubid/bsi/identifiers/draft_document.rb +71 -0
  130. data/lib/pubid/bsi/identifiers/electronic_book.rb +52 -0
  131. data/lib/pubid/bsi/identifiers/expert_commentary.rb +47 -0
  132. data/lib/pubid/bsi/identifiers/explanatory_supplement.rb +82 -0
  133. data/lib/pubid/bsi/identifiers/flex.rb +61 -0
  134. data/lib/pubid/bsi/identifiers/handbook.rb +39 -0
  135. data/lib/pubid/bsi/identifiers/index.rb +62 -0
  136. data/lib/pubid/bsi/identifiers/method.rb +76 -0
  137. data/lib/pubid/bsi/identifiers/national_annex.rb +73 -0
  138. data/lib/pubid/bsi/identifiers/practice_guide.rb +27 -0
  139. data/lib/pubid/bsi/identifiers/publicly_available_specification.rb +79 -0
  140. data/lib/pubid/bsi/identifiers/published_document.rb +79 -0
  141. data/lib/pubid/bsi/identifiers/section.rb +62 -0
  142. data/lib/pubid/bsi/identifiers/set.rb +46 -0
  143. data/lib/pubid/bsi/identifiers/standalone_amendment.rb +40 -0
  144. data/lib/pubid/bsi/identifiers/supplement_document.rb +51 -0
  145. data/lib/pubid/bsi/identifiers/supplementary_index.rb +81 -0
  146. data/lib/pubid/bsi/identifiers/technical_specification.rb +79 -0
  147. data/lib/pubid/bsi/identifiers/test_method.rb +67 -0
  148. data/lib/pubid/bsi/identifiers/value_added_publication.rb +52 -0
  149. data/lib/pubid/bsi/identifiers.rb +52 -0
  150. data/lib/pubid/bsi/model.rb +196 -0
  151. data/lib/pubid/bsi/parser.rb +659 -0
  152. data/lib/pubid/bsi/scheme.rb +243 -0
  153. data/lib/pubid/bsi/single_identifier.rb +129 -0
  154. data/lib/pubid/bsi/urn_generator.rb +84 -0
  155. data/lib/pubid/bsi.rb +32 -0
  156. data/lib/pubid/builder/base.rb +138 -0
  157. data/lib/pubid/bundled_identifier.rb +126 -0
  158. data/lib/pubid/ccsds/builder.rb +56 -0
  159. data/lib/pubid/ccsds/identifier.rb +16 -0
  160. data/lib/pubid/ccsds/identifiers/base.rb +78 -0
  161. data/lib/pubid/ccsds/identifiers/base_BASE_88929.rb +70 -0
  162. data/lib/pubid/ccsds/identifiers/corrigendum.rb +39 -0
  163. data/lib/pubid/ccsds/identifiers.rb +10 -0
  164. data/lib/pubid/ccsds/parser.rb +71 -0
  165. data/lib/pubid/ccsds/scheme.rb +57 -0
  166. data/lib/pubid/ccsds/single_identifier.rb +74 -0
  167. data/lib/pubid/ccsds/supplement_identifier.rb +33 -0
  168. data/lib/pubid/ccsds/urn_generator.rb +115 -0
  169. data/lib/pubid/ccsds.rb +21 -0
  170. data/lib/pubid/cen_cenelec/builder.rb +330 -0
  171. data/lib/pubid/cen_cenelec/identifier.rb +15 -0
  172. data/lib/pubid/cen_cenelec/identifiers/adopted_european_norm.rb +40 -0
  173. data/lib/pubid/cen_cenelec/identifiers/amendment.rb +29 -0
  174. data/lib/pubid/cen_cenelec/identifiers/base.rb +75 -0
  175. data/lib/pubid/cen_cenelec/identifiers/cen_report.rb +28 -0
  176. data/lib/pubid/cen_cenelec/identifiers/cen_workshop_agreement.rb +27 -0
  177. data/lib/pubid/cen_cenelec/identifiers/cenelec_harmonization_document.rb +28 -0
  178. data/lib/pubid/cen_cenelec/identifiers/consolidated_identifier.rb +61 -0
  179. data/lib/pubid/cen_cenelec/identifiers/corrigendum.rb +35 -0
  180. data/lib/pubid/cen_cenelec/identifiers/european_norm.rb +41 -0
  181. data/lib/pubid/cen_cenelec/identifiers/european_prestandard.rb +37 -0
  182. data/lib/pubid/cen_cenelec/identifiers/european_specification.rb +28 -0
  183. data/lib/pubid/cen_cenelec/identifiers/fragment.rb +22 -0
  184. data/lib/pubid/cen_cenelec/identifiers/guide.rb +27 -0
  185. data/lib/pubid/cen_cenelec/identifiers/harmonization_document.rb +27 -0
  186. data/lib/pubid/cen_cenelec/identifiers/technical_report.rb +27 -0
  187. data/lib/pubid/cen_cenelec/identifiers/technical_specification.rb +35 -0
  188. data/lib/pubid/cen_cenelec/identifiers.rb +32 -0
  189. data/lib/pubid/cen_cenelec/parser.rb +144 -0
  190. data/lib/pubid/cen_cenelec/scheme.rb +164 -0
  191. data/lib/pubid/cen_cenelec/single_identifier.rb +130 -0
  192. data/lib/pubid/cen_cenelec/supplement_identifier.rb +48 -0
  193. data/lib/pubid/cen_cenelec/urn_generator.rb +129 -0
  194. data/lib/pubid/cen_cenelec.rb +21 -0
  195. data/lib/pubid/cie/builder.rb +399 -0
  196. data/lib/pubid/cie/components/code.rb +72 -0
  197. data/lib/pubid/cie/components/language.rb +58 -0
  198. data/lib/pubid/cie/identifier.rb +18 -0
  199. data/lib/pubid/cie/identifiers/bundle.rb +20 -0
  200. data/lib/pubid/cie/identifiers/conference.rb +32 -0
  201. data/lib/pubid/cie/identifiers/corrigendum.rb +40 -0
  202. data/lib/pubid/cie/identifiers/dual_published.rb +41 -0
  203. data/lib/pubid/cie/identifiers/identical.rb +64 -0
  204. data/lib/pubid/cie/identifiers/joint_published.rb +52 -0
  205. data/lib/pubid/cie/identifiers/standard.rb +58 -0
  206. data/lib/pubid/cie/identifiers/supplement.rb +45 -0
  207. data/lib/pubid/cie/identifiers/tutorial_bundle.rb +20 -0
  208. data/lib/pubid/cie/identifiers.rb +17 -0
  209. data/lib/pubid/cie/parser.rb +347 -0
  210. data/lib/pubid/cie/scheme.rb +64 -0
  211. data/lib/pubid/cie/single_identifier.rb +30 -0
  212. data/lib/pubid/cie/supplement_identifier.rb +26 -0
  213. data/lib/pubid/cie/urn_generator.rb +123 -0
  214. data/lib/pubid/cie.rb +28 -0
  215. data/lib/pubid/components/code.rb +33 -0
  216. data/lib/pubid/components/date.rb +49 -0
  217. data/lib/pubid/components/edition.rb +32 -0
  218. data/lib/pubid/components/language.rb +37 -0
  219. data/lib/pubid/components/locality.rb +10 -0
  220. data/lib/pubid/components/publisher.rb +36 -0
  221. data/lib/pubid/components/stage.rb +54 -0
  222. data/lib/pubid/components/type.rb +58 -0
  223. data/lib/pubid/components/typed_stage.rb +55 -0
  224. data/lib/pubid/components.rb +15 -0
  225. data/lib/pubid/core/pattern_doc_generator.rb +272 -0
  226. data/lib/pubid/core/update_codes.rb +77 -0
  227. data/lib/pubid/core.rb +8 -0
  228. data/lib/pubid/csa/builder.rb +671 -0
  229. data/lib/pubid/csa/components/code.rb +9 -0
  230. data/lib/pubid/csa/components.rb +9 -0
  231. data/lib/pubid/csa/composite_identifier.rb +27 -0
  232. data/lib/pubid/csa/identifier.rb +457 -0
  233. data/lib/pubid/csa/identifiers/base.rb +133 -0
  234. data/lib/pubid/csa/identifiers/bundled.rb +125 -0
  235. data/lib/pubid/csa/identifiers/canadian_adopted.rb +82 -0
  236. data/lib/pubid/csa/identifiers/cec.rb +129 -0
  237. data/lib/pubid/csa/identifiers/combined.rb +130 -0
  238. data/lib/pubid/csa/identifiers/csa_adopted.rb +78 -0
  239. data/lib/pubid/csa/identifiers/package.rb +65 -0
  240. data/lib/pubid/csa/identifiers/series.rb +127 -0
  241. data/lib/pubid/csa/identifiers/standard.rb +10 -0
  242. data/lib/pubid/csa/identifiers.rb +17 -0
  243. data/lib/pubid/csa/parser.rb +445 -0
  244. data/lib/pubid/csa/scheme.rb +44 -0
  245. data/lib/pubid/csa/single_identifier.rb +30 -0
  246. data/lib/pubid/csa/urn_generator.rb +80 -0
  247. data/lib/pubid/csa/wrapper_identifier.rb +31 -0
  248. data/lib/pubid/csa.rb +25 -0
  249. data/lib/pubid/etsi/builder.rb +133 -0
  250. data/lib/pubid/etsi/components/code.rb +42 -0
  251. data/lib/pubid/etsi/components/version.rb +37 -0
  252. data/lib/pubid/etsi/components.rb +10 -0
  253. data/lib/pubid/etsi/identifier.rb +14 -0
  254. data/lib/pubid/etsi/identifiers/amendment.rb +15 -0
  255. data/lib/pubid/etsi/identifiers/base.rb +38 -0
  256. data/lib/pubid/etsi/identifiers/corrigendum.rb +15 -0
  257. data/lib/pubid/etsi/identifiers/etsi_standard.rb +19 -0
  258. data/lib/pubid/etsi/identifiers/supplement_identifier.rb +91 -0
  259. data/lib/pubid/etsi/identifiers.rb +14 -0
  260. data/lib/pubid/etsi/parser.rb +133 -0
  261. data/lib/pubid/etsi/scheme.rb +42 -0
  262. data/lib/pubid/etsi/urn_generator.rb +76 -0
  263. data/lib/pubid/etsi.rb +21 -0
  264. data/lib/pubid/export/auditor.rb +89 -0
  265. data/lib/pubid/export/data_class_exporter.rb +59 -0
  266. data/lib/pubid/export/exporter.rb +74 -0
  267. data/lib/pubid/export/flavor_exporter.rb +402 -0
  268. data/lib/pubid/export/ieee_exporter.rb +78 -0
  269. data/lib/pubid/export/itu_exporter.rb +66 -0
  270. data/lib/pubid/export/nist_exporter.rb +64 -0
  271. data/lib/pubid/export/registry_exporter.rb +90 -0
  272. data/lib/pubid/export/result.rb +97 -0
  273. data/lib/pubid/export/scheme_exporter.rb +70 -0
  274. data/lib/pubid/export.rb +18 -0
  275. data/lib/pubid/format_detector.rb +16 -0
  276. data/lib/pubid/format_registry.rb +42 -0
  277. data/lib/pubid/identifier.rb +235 -0
  278. data/lib/pubid/identifier_metadata.rb +148 -0
  279. data/lib/pubid/identifier_registry.rb +198 -0
  280. data/lib/pubid/idf/builder.rb +82 -0
  281. data/lib/pubid/idf/identifier.rb +69 -0
  282. data/lib/pubid/idf/identifiers/amendment.rb +27 -0
  283. data/lib/pubid/idf/identifiers/corrigendum.rb +27 -0
  284. data/lib/pubid/idf/identifiers/international_standard.rb +123 -0
  285. data/lib/pubid/idf/identifiers/reviewed_method.rb +100 -0
  286. data/lib/pubid/idf/identifiers.rb +13 -0
  287. data/lib/pubid/idf/parser.rb +143 -0
  288. data/lib/pubid/idf/scheme.rb +61 -0
  289. data/lib/pubid/idf/single_identifier.rb +19 -0
  290. data/lib/pubid/idf/supplement_identifier.rb +43 -0
  291. data/lib/pubid/idf/urn_generator.rb +84 -0
  292. data/lib/pubid/idf.rb +25 -0
  293. data/lib/pubid/iec/builder.rb +457 -0
  294. data/lib/pubid/iec/components/code.rb +59 -0
  295. data/lib/pubid/iec/components/consolidated_amendment.rb +59 -0
  296. data/lib/pubid/iec/components/publisher.rb +35 -0
  297. data/lib/pubid/iec/components/sheet.rb +32 -0
  298. data/lib/pubid/iec/components/trf_info.rb +38 -0
  299. data/lib/pubid/iec/components/vap_suffix.rb +41 -0
  300. data/lib/pubid/iec/identifier.rb +21 -0
  301. data/lib/pubid/iec/identifiers/amendment.rb +94 -0
  302. data/lib/pubid/iec/identifiers/base.rb +78 -0
  303. data/lib/pubid/iec/identifiers/component_specification.rb +39 -0
  304. data/lib/pubid/iec/identifiers/conformity_assessment.rb +39 -0
  305. data/lib/pubid/iec/identifiers/consolidated_identifier.rb +86 -0
  306. data/lib/pubid/iec/identifiers/corrigendum.rb +94 -0
  307. data/lib/pubid/iec/identifiers/fragment_identifier.rb +141 -0
  308. data/lib/pubid/iec/identifiers/guide.rb +104 -0
  309. data/lib/pubid/iec/identifiers/international_standard.rb +147 -0
  310. data/lib/pubid/iec/identifiers/interpretation_sheet.rb +104 -0
  311. data/lib/pubid/iec/identifiers/operational_document.rb +39 -0
  312. data/lib/pubid/iec/identifiers/publicly_available_specification.rb +101 -0
  313. data/lib/pubid/iec/identifiers/sheet_identifier.rb +66 -0
  314. data/lib/pubid/iec/identifiers/societal_technology_trend_report.rb +40 -0
  315. data/lib/pubid/iec/identifiers/systems_reference_document.rb +40 -0
  316. data/lib/pubid/iec/identifiers/technical_report.rb +132 -0
  317. data/lib/pubid/iec/identifiers/technical_specification.rb +132 -0
  318. data/lib/pubid/iec/identifiers/technology_report.rb +39 -0
  319. data/lib/pubid/iec/identifiers/test_report_form.rb +78 -0
  320. data/lib/pubid/iec/identifiers/vap_identifier.rb +77 -0
  321. data/lib/pubid/iec/identifiers/white_paper.rb +39 -0
  322. data/lib/pubid/iec/identifiers/working_document.rb +96 -0
  323. data/lib/pubid/iec/parser.rb +412 -0
  324. data/lib/pubid/iec/rendering_style.rb +113 -0
  325. data/lib/pubid/iec/scheme.rb +71 -0
  326. data/lib/pubid/iec/single_identifier.rb +80 -0
  327. data/lib/pubid/iec/supplement_identifier.rb +161 -0
  328. data/lib/pubid/iec/urn_generator.rb +193 -0
  329. data/lib/pubid/iec/urn_parser.rb +289 -0
  330. data/lib/pubid/iec.rb +85 -0
  331. data/lib/pubid/ieee/aiee/builder.rb +71 -0
  332. data/lib/pubid/ieee/aiee/identifier.rb +105 -0
  333. data/lib/pubid/ieee/aiee/parser.rb +130 -0
  334. data/lib/pubid/ieee/aiee.rb +11 -0
  335. data/lib/pubid/ieee/builder.rb +1237 -0
  336. data/lib/pubid/ieee/components/code.rb +102 -0
  337. data/lib/pubid/ieee/components/draft.rb +93 -0
  338. data/lib/pubid/ieee/components/relationship.rb +157 -0
  339. data/lib/pubid/ieee/components/typed_stage.rb +100 -0
  340. data/lib/pubid/ieee/identifier.rb +13 -0
  341. data/lib/pubid/ieee/identifiers/adopted_standard.rb +33 -0
  342. data/lib/pubid/ieee/identifiers/base.rb +591 -0
  343. data/lib/pubid/ieee/identifiers/conformance_identifier.rb +35 -0
  344. data/lib/pubid/ieee/identifiers/corrigendum.rb +37 -0
  345. data/lib/pubid/ieee/identifiers/csa_dual_published.rb +51 -0
  346. data/lib/pubid/ieee/identifiers/dual_identifier.rb +18 -0
  347. data/lib/pubid/ieee/identifiers/dual_published.rb +28 -0
  348. data/lib/pubid/ieee/identifiers/iec_ieee_copublished.rb +27 -0
  349. data/lib/pubid/ieee/identifiers/interpretation_identifier.rb +34 -0
  350. data/lib/pubid/ieee/identifiers/joint_development.rb +172 -0
  351. data/lib/pubid/ieee/identifiers/multi_numbered_identifier.rb +51 -0
  352. data/lib/pubid/ieee/identifiers/nesc/base.rb +56 -0
  353. data/lib/pubid/ieee/identifiers/nesc/draft.rb +28 -0
  354. data/lib/pubid/ieee/identifiers/nesc/handbook.rb +32 -0
  355. data/lib/pubid/ieee/identifiers/nesc/redline.rb +26 -0
  356. data/lib/pubid/ieee/identifiers/nesc/standard.rb +26 -0
  357. data/lib/pubid/ieee/identifiers/nesc.rb +15 -0
  358. data/lib/pubid/ieee/identifiers/parenthetical_identifier.rb +20 -0
  359. data/lib/pubid/ieee/identifiers/project_draft_identifier.rb +26 -0
  360. data/lib/pubid/ieee/identifiers/redlined_standard.rb +33 -0
  361. data/lib/pubid/ieee/identifiers/si_standard.rb +73 -0
  362. data/lib/pubid/ieee/identifiers/standard.rb +41 -0
  363. data/lib/pubid/ieee/identifiers/supplement_identifier.rb +23 -0
  364. data/lib/pubid/ieee/identifiers.rb +33 -0
  365. data/lib/pubid/ieee/ire/builder.rb +61 -0
  366. data/lib/pubid/ieee/ire/identifier.rb +58 -0
  367. data/lib/pubid/ieee/ire/parser.rb +91 -0
  368. data/lib/pubid/ieee/ire.rb +11 -0
  369. data/lib/pubid/ieee/nesc/builder.rb +101 -0
  370. data/lib/pubid/ieee/nesc/parser.rb +154 -0
  371. data/lib/pubid/ieee/nesc.rb +10 -0
  372. data/lib/pubid/ieee/parser.rb +1226 -0
  373. data/lib/pubid/ieee/scheme.rb +90 -0
  374. data/lib/pubid/ieee/typed_stages.rb +172 -0
  375. data/lib/pubid/ieee/urn_generator.rb +188 -0
  376. data/lib/pubid/ieee.rb +32 -0
  377. data/lib/pubid/ieee_debug.rb +31 -0
  378. data/lib/pubid/iho/builder.rb +37 -0
  379. data/lib/pubid/iho/identifier.rb +19 -0
  380. data/lib/pubid/iho/identifiers/base.rb +41 -0
  381. data/lib/pubid/iho/identifiers/bibliographic.rb +20 -0
  382. data/lib/pubid/iho/identifiers/circular_letter.rb +19 -0
  383. data/lib/pubid/iho/identifiers/miscellaneous.rb +20 -0
  384. data/lib/pubid/iho/identifiers/publication.rb +19 -0
  385. data/lib/pubid/iho/identifiers/standard.rb +19 -0
  386. data/lib/pubid/iho/identifiers.rb +14 -0
  387. data/lib/pubid/iho/parser.rb +68 -0
  388. data/lib/pubid/iho/scheme.rb +29 -0
  389. data/lib/pubid/iho/urn_generator.rb +29 -0
  390. data/lib/pubid/iho.rb +21 -0
  391. data/lib/pubid/iso/builder.rb +305 -0
  392. data/lib/pubid/iso/bundled_identifier.rb +85 -0
  393. data/lib/pubid/iso/combined_identifier.rb +22 -0
  394. data/lib/pubid/iso/components/code.rb +36 -0
  395. data/lib/pubid/iso/components/publisher.rb +60 -0
  396. data/lib/pubid/iso/components.rb +12 -0
  397. data/lib/pubid/iso/format_resolver.rb +45 -0
  398. data/lib/pubid/iso/identifier.rb +69 -0
  399. data/lib/pubid/iso/identifiers/addendum.rb +104 -0
  400. data/lib/pubid/iso/identifiers/amendment.rb +128 -0
  401. data/lib/pubid/iso/identifiers/base.rb +115 -0
  402. data/lib/pubid/iso/identifiers/corrigendum.rb +108 -0
  403. data/lib/pubid/iso/identifiers/data.rb +76 -0
  404. data/lib/pubid/iso/identifiers/directives.rb +59 -0
  405. data/lib/pubid/iso/identifiers/directives_supplement.rb +119 -0
  406. data/lib/pubid/iso/identifiers/extract.rb +30 -0
  407. data/lib/pubid/iso/identifiers/guide.rb +100 -0
  408. data/lib/pubid/iso/identifiers/international_standard.rb +168 -0
  409. data/lib/pubid/iso/identifiers/international_standardized_profile.rb +94 -0
  410. data/lib/pubid/iso/identifiers/international_workshop_agreement.rb +89 -0
  411. data/lib/pubid/iso/identifiers/pas.rb +93 -0
  412. data/lib/pubid/iso/identifiers/recommendation.rb +45 -0
  413. data/lib/pubid/iso/identifiers/supplement.rb +87 -0
  414. data/lib/pubid/iso/identifiers/tc_document.rb +108 -0
  415. data/lib/pubid/iso/identifiers/technical_report.rb +103 -0
  416. data/lib/pubid/iso/identifiers/technical_specification.rb +102 -0
  417. data/lib/pubid/iso/identifiers/technology_trends_assessments.rb +95 -0
  418. data/lib/pubid/iso/identifiers.rb +33 -0
  419. data/lib/pubid/iso/parser.rb +510 -0
  420. data/lib/pubid/iso/rendering_style.rb +120 -0
  421. data/lib/pubid/iso/scheme.rb +187 -0
  422. data/lib/pubid/iso/single_identifier.rb +61 -0
  423. data/lib/pubid/iso/supplement_identifier.rb +27 -0
  424. data/lib/pubid/iso/urn_generator.rb +412 -0
  425. data/lib/pubid/iso/urn_parser.rb +423 -0
  426. data/lib/pubid/iso/utilities.rb +86 -0
  427. data/lib/pubid/iso.rb +50 -0
  428. data/lib/pubid/itu/builder.rb +171 -0
  429. data/lib/pubid/itu/components/code.rb +39 -0
  430. data/lib/pubid/itu/components/sector.rb +35 -0
  431. data/lib/pubid/itu/components/series.rb +29 -0
  432. data/lib/pubid/itu/i18n.rb +9 -0
  433. data/lib/pubid/itu/i18n.yaml +30 -0
  434. data/lib/pubid/itu/identifier.rb +53 -0
  435. data/lib/pubid/itu/identifiers/amendment.rb +43 -0
  436. data/lib/pubid/itu/identifiers/annex.rb +74 -0
  437. data/lib/pubid/itu/identifiers/base.rb +154 -0
  438. data/lib/pubid/itu/identifiers/combined_identifier.rb +47 -0
  439. data/lib/pubid/itu/identifiers/corrigendum.rb +44 -0
  440. data/lib/pubid/itu/identifiers/recommendation.rb +16 -0
  441. data/lib/pubid/itu/identifiers/special_publication.rb +31 -0
  442. data/lib/pubid/itu/identifiers/supplement.rb +46 -0
  443. data/lib/pubid/itu/identifiers.rb +16 -0
  444. data/lib/pubid/itu/model.rb +111 -0
  445. data/lib/pubid/itu/parser.rb +225 -0
  446. data/lib/pubid/itu/scheme.rb +174 -0
  447. data/lib/pubid/itu/urn_generator.rb +105 -0
  448. data/lib/pubid/itu.rb +22 -0
  449. data/lib/pubid/jcgm/builder.rb +88 -0
  450. data/lib/pubid/jcgm/components/publisher.rb +20 -0
  451. data/lib/pubid/jcgm/components.rb +9 -0
  452. data/lib/pubid/jcgm/identifier.rb +11 -0
  453. data/lib/pubid/jcgm/identifiers/amendment.rb +35 -0
  454. data/lib/pubid/jcgm/identifiers/guide.rb +21 -0
  455. data/lib/pubid/jcgm/identifiers/gum_guide.rb +51 -0
  456. data/lib/pubid/jcgm/identifiers.rb +11 -0
  457. data/lib/pubid/jcgm/parser.rb +84 -0
  458. data/lib/pubid/jcgm/scheme.rb +60 -0
  459. data/lib/pubid/jcgm/single_identifier.rb +48 -0
  460. data/lib/pubid/jcgm/supplement_identifier.rb +16 -0
  461. data/lib/pubid/jcgm/urn_generator.rb +110 -0
  462. data/lib/pubid/jcgm.rb +31 -0
  463. data/lib/pubid/jis/builder.rb +124 -0
  464. data/lib/pubid/jis/components/code.rb +59 -0
  465. data/lib/pubid/jis/components.rb +9 -0
  466. data/lib/pubid/jis/identifier.rb +18 -0
  467. data/lib/pubid/jis/identifiers/amendment.rb +16 -0
  468. data/lib/pubid/jis/identifiers/base.rb +72 -0
  469. data/lib/pubid/jis/identifiers/explanation.rb +22 -0
  470. data/lib/pubid/jis/identifiers/japanese_industrial_standard.rb +16 -0
  471. data/lib/pubid/jis/identifiers/standard.rb +27 -0
  472. data/lib/pubid/jis/identifiers/technical_report.rb +31 -0
  473. data/lib/pubid/jis/identifiers/technical_specification.rb +31 -0
  474. data/lib/pubid/jis/identifiers.rb +17 -0
  475. data/lib/pubid/jis/parser.rb +109 -0
  476. data/lib/pubid/jis/scheme.rb +49 -0
  477. data/lib/pubid/jis/single_identifier.rb +37 -0
  478. data/lib/pubid/jis/supplement_identifier.rb +47 -0
  479. data/lib/pubid/jis/urn_generator.rb +25 -0
  480. data/lib/pubid/jis.rb +23 -0
  481. data/lib/pubid/lutaml/no_store_registration.rb +30 -0
  482. data/lib/pubid/nist/builder.rb +2100 -0
  483. data/lib/pubid/nist/components/code.rb +38 -0
  484. data/lib/pubid/nist/components/edition.rb +118 -0
  485. data/lib/pubid/nist/components/issue_number.rb +28 -0
  486. data/lib/pubid/nist/components/part.rb +77 -0
  487. data/lib/pubid/nist/components/publisher.rb +24 -0
  488. data/lib/pubid/nist/components/stage.rb +53 -0
  489. data/lib/pubid/nist/components/supplement.rb +121 -0
  490. data/lib/pubid/nist/components/translation.rb +42 -0
  491. data/lib/pubid/nist/components/update.rb +103 -0
  492. data/lib/pubid/nist/components/version.rb +35 -0
  493. data/lib/pubid/nist/components/volume.rb +32 -0
  494. data/lib/pubid/nist/components.rb +19 -0
  495. data/lib/pubid/nist/configuration.rb +77 -0
  496. data/lib/pubid/nist/identifiers/base.rb +499 -0
  497. data/lib/pubid/nist/identifiers/circular.rb +68 -0
  498. data/lib/pubid/nist/identifiers/circular_supplement.rb +50 -0
  499. data/lib/pubid/nist/identifiers/commercial_standard.rb +41 -0
  500. data/lib/pubid/nist/identifiers/commercial_standard_emergency.rb +56 -0
  501. data/lib/pubid/nist/identifiers/commercial_standards_monthly.rb +56 -0
  502. data/lib/pubid/nist/identifiers/crpl_report.rb +135 -0
  503. data/lib/pubid/nist/identifiers/federal_information_processing_standards.rb +94 -0
  504. data/lib/pubid/nist/identifiers/grant_contractor_report.rb +35 -0
  505. data/lib/pubid/nist/identifiers/handbook.rb +50 -0
  506. data/lib/pubid/nist/identifiers/internal_report.rb +56 -0
  507. data/lib/pubid/nist/identifiers/letter_circular.rb +45 -0
  508. data/lib/pubid/nist/identifiers/miscellaneous_publication.rb +65 -0
  509. data/lib/pubid/nist/identifiers/monograph.rb +69 -0
  510. data/lib/pubid/nist/identifiers/ncstar.rb +41 -0
  511. data/lib/pubid/nist/identifiers/nsrds.rb +41 -0
  512. data/lib/pubid/nist/identifiers/owmwp.rb +35 -0
  513. data/lib/pubid/nist/identifiers/report.rb +68 -0
  514. data/lib/pubid/nist/identifiers/special_publication.rb +36 -0
  515. data/lib/pubid/nist/identifiers/technical_note.rb +90 -0
  516. data/lib/pubid/nist/identifiers.rb +33 -0
  517. data/lib/pubid/nist/parser.rb +1084 -0
  518. data/lib/pubid/nist/scheme.rb +199 -0
  519. data/lib/pubid/nist/supplement_identifier.rb +83 -0
  520. data/lib/pubid/nist/urn_generator.rb +127 -0
  521. data/lib/pubid/nist.rb +36 -0
  522. data/lib/pubid/oiml/builder.rb +189 -0
  523. data/lib/pubid/oiml/components/code.rb +20 -0
  524. data/lib/pubid/oiml/components.rb +9 -0
  525. data/lib/pubid/oiml/identifier.rb +11 -0
  526. data/lib/pubid/oiml/identifiers/amendment.rb +13 -0
  527. data/lib/pubid/oiml/identifiers/annex.rb +62 -0
  528. data/lib/pubid/oiml/identifiers/base.rb +36 -0
  529. data/lib/pubid/oiml/identifiers/basic_publication.rb +13 -0
  530. data/lib/pubid/oiml/identifiers/document.rb +13 -0
  531. data/lib/pubid/oiml/identifiers/expert_report.rb +13 -0
  532. data/lib/pubid/oiml/identifiers/guide.rb +13 -0
  533. data/lib/pubid/oiml/identifiers/recommendation.rb +13 -0
  534. data/lib/pubid/oiml/identifiers/seminar_report.rb +13 -0
  535. data/lib/pubid/oiml/identifiers/vocabulary.rb +13 -0
  536. data/lib/pubid/oiml/identifiers.rb +18 -0
  537. data/lib/pubid/oiml/parser.rb +173 -0
  538. data/lib/pubid/oiml/scheme.rb +46 -0
  539. data/lib/pubid/oiml/single_identifier.rb +90 -0
  540. data/lib/pubid/oiml/supplement_identifier.rb +43 -0
  541. data/lib/pubid/oiml/urn_generator.rb +64 -0
  542. data/lib/pubid/oiml.rb +26 -0
  543. data/lib/pubid/parser/common_parse_methods.rb +13 -0
  544. data/lib/pubid/parser/common_parse_rules.rb +56 -0
  545. data/lib/pubid/parser.rb +8 -0
  546. data/lib/pubid/parsers/base.rb +11 -0
  547. data/lib/pubid/parsers/mr_string.rb +93 -0
  548. data/lib/pubid/plateau/builder.rb +50 -0
  549. data/lib/pubid/plateau/identifiers/annex.rb +16 -0
  550. data/lib/pubid/plateau/identifiers/base.rb +51 -0
  551. data/lib/pubid/plateau/identifiers/handbook.rb +34 -0
  552. data/lib/pubid/plateau/identifiers/technical_report.rb +20 -0
  553. data/lib/pubid/plateau/identifiers.rb +12 -0
  554. data/lib/pubid/plateau/parser.rb +63 -0
  555. data/lib/pubid/plateau/scheme.rb +45 -0
  556. data/lib/pubid/plateau/supplement_identifier.rb +72 -0
  557. data/lib/pubid/plateau/urn_generator.rb +29 -0
  558. data/lib/pubid/plateau.rb +25 -0
  559. data/lib/pubid/renderers/base.rb +19 -0
  560. data/lib/pubid/renderers/directives_renderer.rb +62 -0
  561. data/lib/pubid/renderers/guide_renderer.rb +20 -0
  562. data/lib/pubid/renderers/human_readable.rb +58 -0
  563. data/lib/pubid/renderers/iwa_renderer.rb +16 -0
  564. data/lib/pubid/renderers/mr_string.rb +16 -0
  565. data/lib/pubid/renderers/supplement_renderer.rb +33 -0
  566. data/lib/pubid/renderers/urn.rb +11 -0
  567. data/lib/pubid/renderers.rb +14 -0
  568. data/lib/pubid/rendering/base.rb +73 -0
  569. data/lib/pubid/rendering/common.rb +211 -0
  570. data/lib/pubid/rendering/context.rb +156 -0
  571. data/lib/pubid/rendering/date.rb +27 -0
  572. data/lib/pubid/rendering/format.rb +25 -0
  573. data/lib/pubid/rendering/language.rb +21 -0
  574. data/lib/pubid/rendering/numbering.rb +24 -0
  575. data/lib/pubid/rendering/publisher.rb +25 -0
  576. data/lib/pubid/rendering/stage.rb +38 -0
  577. data/lib/pubid/rendering/supplement.rb +46 -0
  578. data/lib/pubid/rendering.rb +16 -0
  579. data/lib/pubid/sae/builder.rb +32 -0
  580. data/lib/pubid/sae/components/code.rb +9 -0
  581. data/lib/pubid/sae/components/date.rb +19 -0
  582. data/lib/pubid/sae/components/type.rb +19 -0
  583. data/lib/pubid/sae/components.rb +11 -0
  584. data/lib/pubid/sae/identifier.rb +14 -0
  585. data/lib/pubid/sae/identifiers/base.rb +42 -0
  586. data/lib/pubid/sae/identifiers.rb +9 -0
  587. data/lib/pubid/sae/parser.rb +55 -0
  588. data/lib/pubid/sae/scheme.rb +47 -0
  589. data/lib/pubid/sae/urn_generator.rb +38 -0
  590. data/lib/pubid/sae.rb +19 -0
  591. data/lib/pubid/scheme.rb +207 -0
  592. data/lib/pubid/urn_generator/base.rb +110 -0
  593. data/lib/pubid/utils/string_normalizer.rb +196 -0
  594. data/lib/pubid/utils.rb +7 -0
  595. data/lib/pubid/version.rb +3 -1
  596. data/lib/pubid.rb +137 -13
  597. data/lib/tasks/docs.rake +37 -0
  598. data/lib/tasks/export.rake +38 -0
  599. data/lib/tasks/website-data.json +7488 -0
  600. metadata +613 -171
  601. data/lib/pubid/registry.rb +0 -30
@@ -0,0 +1,724 @@
1
+ # frozen_string_literal: true
2
+
3
+ require "parslet"
4
+
5
+ module Pubid
6
+ module Ashrae
7
+ # Parser class for ASHRAE identifiers
8
+ # Single Responsibility: Parsing ASHRAE identifier syntax
9
+ class Parser < Parslet::Parser
10
+ # Basic building blocks
11
+ rule(:space) { str(" ") }
12
+ rule(:space?) { space.maybe }
13
+ rule(:dash) { str("-") }
14
+ rule(:dot) { str(".") }
15
+ rule(:slash) { str("/") }
16
+ rule(:lparen) { str("(") }
17
+ rule(:rparen) { str(")") }
18
+ rule(:comma) { str(",") }
19
+ rule(:colon) { str(":") }
20
+
21
+ rule(:digit) { match("[0-9]") }
22
+ rule(:digits) { digit.repeat(1) }
23
+ rule(:letter) { match("[A-Za-z]") }
24
+
25
+ # Year pattern (4 digits starting with 19 or 20)
26
+ rule(:year_digits) do
27
+ (str("19") | str("20")) >> digit.repeat(2, 2)
28
+ end
29
+
30
+ # Reaffirmation year (2 or 4 digits)
31
+ rule(:reaffirmation_year) do
32
+ year_digits | digit.repeat(2, 2)
33
+ end
34
+
35
+ # Publisher
36
+ rule(:publisher) { str("ASHRAE") }
37
+
38
+ # Type (Guideline or Standard)
39
+ rule(:type) do
40
+ str("Guideline") | str("Standard")
41
+ end
42
+
43
+ # Code pattern (e.g., 15, 90.1, 41.10, 118.1, 90A,B,C)
44
+ rule(:code) do
45
+ (
46
+ digits >> # First part (e.g., 15, 90)
47
+ (dot >> digits).repeat(0, 2) >> # Optional dotted parts (e.g., .1, .10)
48
+ # Special pattern for codes like "90A,B,C" (letter + comma-separated letters)
49
+ (
50
+ letter >> # Single letter after digits (e.g., "A" in "90A")
51
+ (comma >> letter).repeat(0, 10) # Optional comma-separated letters (e.g., ",B,C")
52
+ ).maybe # This entire letter+commas pattern is optional
53
+ ).as(:code)
54
+ end
55
+
56
+ # Code with year pattern (e.g., 34-2024, 62.1-2022, 90A-2010) - used when type is missing
57
+ rule(:code_with_year) do
58
+ (
59
+ digits >> # First part (e.g., 34, 62)
60
+ (dot >> digits).repeat(0, 2) >> # Optional dotted parts (e.g., .1)
61
+ # Special pattern for codes like "90A,B,C-2010"
62
+ (
63
+ letter >> # Single letter after digits
64
+ (comma >> letter).repeat(0, 10) # Optional comma-separated letters
65
+ ).maybe >>
66
+ space?.maybe >> dash >>
67
+ year_digits.as(:year)
68
+ ).as(:code_with_year)
69
+ end
70
+
71
+ # Suffix (R for revision, P for proposed)
72
+ rule(:suffix) do
73
+ (str("R") | str("P")).as(:suffix)
74
+ end
75
+
76
+ # Additional copublisher pattern (e.g., /AMCA 210-99 or (ANSI/AMCA 330-97))
77
+ rule(:additional_copublisher) do
78
+ (slash >> (letter.repeat(4,
79
+ 10) >> space >> (digits >> (dash >> digits).maybe).maybe).as(:additional_copublisher)) |
80
+ (lparen >> (str("ANSI") >> slash >> (letter.repeat(2,
81
+ 10) >> (slash >> letter.repeat(2, 10)).repeat(0,
82
+ 2))).as(:additional_copublisher) >> space >> (digits >> (dash >> digits).maybe).maybe >> rparen)
83
+ end
84
+
85
+ # Optional suffix in parentheses (PDF), (I-P and SI versions), long descriptions, etc.
86
+ rule(:optional_suffix) do
87
+ space.maybe >> lparen >> (
88
+ str("PDF") | # Special case for PDF
89
+ (letter.repeat(1, 20) >> (space | digit | comma | dash | dot | letter | str("–")).repeat(0, 500)) # General case including long descriptions
90
+ ) >> rparen
91
+ end
92
+
93
+ # Reaffirmation pattern (RA YEAR or RA-YEAR)
94
+ rule(:reaffirmed) do
95
+ (space.maybe >> lparen >> str("RA") >> space? >> reaffirmation_year.as(:reaffirmed) >> rparen) |
96
+ (space.maybe >> lparen >> str("RA") >> dash >> reaffirmation_year.as(:reaffirmed) >> rparen) |
97
+ (space >> str("RA") >> space >> reaffirmation_year.as(:reaffirmed)) |
98
+ (space >> str("RA") >> dash >> reaffirmation_year.as(:reaffirmed))
99
+ end
100
+
101
+ # Addendum code (single letter, multi-letter, or numeric-prefixed like 62o)
102
+ rule(:addendum_code) do
103
+ (digits.maybe >> letter.repeat(1, 3)).as(:addendum_code)
104
+ end
105
+
106
+ # Addendum date pattern (Month Day, Year - e.g., "January 22, 2019")
107
+ rule(:month_name) do
108
+ str("January") | str("February") | str("March") | str("April") | str("May") |
109
+ str("June") | str("July") | str("August") | str("September") | str("October") |
110
+ str("November") | str("December")
111
+ end
112
+
113
+ rule(:errata_date) do
114
+ # Full date: (Month Day, Year)
115
+ (lparen >> month_name >> space >> digit.repeat(1,
116
+ 2) >> comma.maybe >> (space | comma.maybe) >>
117
+ year_digits.as(:errata_year) >> rparen).as(:errata_date) |
118
+ # Month+day without year: (August 27)
119
+ (lparen >> month_name >> space >> digit.repeat(1,
120
+ 2) >> rparen).as(:errata_date) |
121
+ # Numeric date with dash: (7-17- 2003) or (7-17-2003)
122
+ (lparen >> digit.repeat(1, 2) >> dash >> digit.repeat(1,
123
+ 2) >> dash >> space.maybe >> year_digits.as(:errata_year) >> rparen).as(:errata_date)
124
+ end
125
+
126
+ # Errata suffix pattern - handles descriptive text like "– Spanish Edition" after "Errata"
127
+ rule(:errata_suffix) do
128
+ # Regular dash or em dash
129
+ (space >> (str("-") | str("–")) >> space >> (letter >> (space | letter | digit | comma).repeat(0, 50))).repeat(
130
+ 0, 3
131
+ )
132
+ end
133
+
134
+ # Errata suffix on addendum (e.g., "ASHRAE Addendum a to Standard 15-2001 Errata (July 6, 2021)")
135
+ rule(:errata_suffix_on_addendum) do
136
+ space >> str("Errata").as(:errata_keyword) >>
137
+ (
138
+ # Full date: (Month Day, Year)
139
+ (space >> lparen >> month_name >> space >> digit.repeat(1,
140
+ 2) >> comma.maybe >> (space | comma.maybe) >> year_digits >> rparen) |
141
+ # Month+day without year: (August 27)
142
+ (space >> lparen >> month_name >> space >> digit.repeat(1,
143
+ 2) >> rparen) |
144
+ # Numeric date with dash: (7-17-2003)
145
+ (space >> lparen >> digit.repeat(1,
146
+ 2) >> dash >> digit.repeat(1,
147
+ 2) >> dash >> space.maybe >> year_digits >> rparen) |
148
+ # No date at all
149
+ str("")
150
+ )
151
+ end
152
+
153
+ # Errata pattern (base identifier + " Errata (date)")
154
+ rule(:errata_identifier) do
155
+ # Format with copublisher: ANSI/ASHRAE Standard 105-2014 Errata (May 23, 2014)
156
+ ((
157
+ (
158
+ (str("ANSI") >> dash >> str("ASHRAE")) |
159
+ (str("ANSI") >> slash >> str("ASHRAE") >> (slash >> letter.repeat(3, 10)).repeat(
160
+ 0, 10
161
+ ))
162
+ ).as(:copublisher) >> space >>
163
+ type.as(:type) >> space >>
164
+ code >>
165
+ (space?.maybe >> dash >> year_digits.as(:year)).maybe >>
166
+ (space >> additional_copublisher).maybe >>
167
+ suffix.maybe >>
168
+ reaffirmed.maybe
169
+ ).as(:base_identifier) >>
170
+ space >>
171
+ str("Errata").as(:errata_keyword) >>
172
+ (
173
+ (errata_suffix >> errata_date) |
174
+ (errata_date >> errata_suffix) |
175
+ errata_date |
176
+ errata_suffix
177
+ ).maybe >>
178
+ optional_suffix.repeat(0, 2).as(:optional_suffixes)) |
179
+ # Format with copublisher, missing type: ANSI/ASHRAE 51-1999 Errata (May 23, 2014)
180
+ ((
181
+ (
182
+ (str("ANSI") >> dash >> str("ASHRAE")) |
183
+ (str("ANSI") >> slash >> str("ASHRAE") >> (slash >> letter.repeat(3, 10)).repeat(
184
+ 0, 10
185
+ ))
186
+ ).as(:copublisher) >> space >>
187
+ code_with_year >>
188
+ (space >> additional_copublisher).maybe >>
189
+ suffix.maybe >>
190
+ reaffirmed.maybe
191
+ ).as(:base_identifier) >>
192
+ space >>
193
+ str("Errata").as(:errata_keyword) >>
194
+ (
195
+ (errata_suffix >> errata_date) |
196
+ (errata_date >> errata_suffix) |
197
+ errata_date |
198
+ errata_suffix
199
+ ).maybe >>
200
+ optional_suffix.repeat(0, 2).as(:optional_suffixes)) |
201
+ # Format with publisher: ASHRAE Guideline 0-2005 Errata (September 28, 2011)
202
+ ((
203
+ publisher.as(:publisher) >> space >>
204
+ type.as(:type) >> space >>
205
+ code >>
206
+ (space?.maybe >> dash >> year_digits.as(:year)).maybe >>
207
+ (space >> additional_copublisher).maybe >>
208
+ suffix.maybe >>
209
+ reaffirmed.maybe
210
+ ).as(:base_identifier) >>
211
+ space >>
212
+ str("Errata").as(:errata_keyword) >>
213
+ errata_date.maybe >>
214
+ errata_suffix.maybe >>
215
+ optional_suffix.repeat(0, 2).as(:optional_suffixes))
216
+ end
217
+
218
+ # Interpretation pattern ("Interpretations for Standard X-YYYY")
219
+ rule(:interpretation_identifier) do
220
+ str("Interpretations") >> space >>
221
+ str("for") >> space >>
222
+ (type.as(:type) >> space >> code >> (dash >> year_digits.as(:year)).maybe).as(:base_identifier)
223
+ end
224
+
225
+ # Combined Addenda pattern (multiple addendums grouped together)
226
+ rule(:combined_addenda_identifier) do
227
+ # Format 1: ASHRAE Addenda X, Y and Z to Standard/Guideline X-YYYY
228
+ (
229
+ publisher.as(:publisher) >> space >>
230
+ str("Addenda") >> space >>
231
+ addendum_code >> # First addendum code
232
+ (
233
+ (comma >> space >> str("and") >> space >> addendum_code) | # ", and b"
234
+ (space >> str("and") >> space >> addendum_code) | # "and b"
235
+ (comma >> space >> addendum_code).repeat(1, 10) | # comma-separated: "a, b, c"
236
+ (comma >> addendum_code).repeat(1, 10) # comma without space: "a,b,c"
237
+ ).repeat(0, 3).as(:additional_codes) >> # Multiple groups of codes (0-3 to allow single code)
238
+ space >>
239
+ (str("to") | str("for")) >> space >>
240
+ ((str("ANSI") >> slash >> str("ASHRAE") >> (slash >> letter.repeat(3, 10)).repeat(
241
+ 0, 10
242
+ )).as(:copublisher) >> space).maybe >>
243
+ type.as(:type) >> space >>
244
+ code >>
245
+ (dash >> year_digits.as(:year)).maybe >>
246
+ (space >> additional_copublisher).maybe >>
247
+ addendum_date_suffix.maybe >>
248
+ optional_suffix.repeat(0, 2)
249
+ ).as(:combined_addenda) |
250
+ # Format 2: ASHRAE Standard X-YYYY: Addenda a, b, c (colon separator)
251
+ (
252
+ publisher.as(:publisher) >> space >>
253
+ type.as(:type) >> space >>
254
+ code >>
255
+ (dash >> year_digits.as(:year)) >>
256
+ ((colon >> space) | space) >>
257
+ str("Addenda") >> space >>
258
+ addendum_code >> # First addendum code
259
+ (
260
+ # Just match all comma-separated values (including "and" as a code)
261
+ (comma >> space >> addendum_code).repeat(1, 50) |
262
+ # Or comma without space
263
+ (comma >> addendum_code).repeat(1, 50)
264
+ ).as(:additional_codes).maybe >> # Entire additional_codes is optional
265
+ optional_suffix.repeat(0, 2)
266
+ ).as(:combined_addenda) |
267
+ # Format 3: ASHRAE Addenda a, b, c to Standard/Guideline X-YYYY (without publisher at start)
268
+ (
269
+ str("Addenda") >> space >>
270
+ addendum_code >> # First addendum code
271
+ (
272
+ (comma >> space >> str("and") >> space >> addendum_code) | # ", and b"
273
+ (space >> str("and") >> space >> addendum_code) | # "and b"
274
+ (comma >> space >> addendum_code).repeat(1, 20) | # comma-separated
275
+ (comma >> addendum_code).repeat(1, 20) # comma without space
276
+ ).repeat(0, 50).as(:additional_codes) >> # Allow 0 for single addendum
277
+ space >>
278
+ (str("to") | str("for")) >> space >>
279
+ ((str("ANSI") >> slash >> str("ASHRAE") >> (slash >> letter.repeat(3, 10)).repeat(
280
+ 0, 10
281
+ )).as(:copublisher) >> space).maybe >>
282
+ type.as(:type) >> space >>
283
+ code >>
284
+ (dash >> year_digits.as(:year)).maybe >>
285
+ optional_suffix.repeat(0, 2)
286
+ ).as(:combined_addenda) |
287
+ # Format 4: ASHRAE Addenda to Standard/Guideline X-YYYY (without specific codes)
288
+ (
289
+ publisher.as(:publisher) >> space >>
290
+ str("Addenda") >> space >>
291
+ (str("to") | str("for")) >> space >>
292
+ type.as(:type) >> space >>
293
+ code >>
294
+ (dash >> year_digits.as(:year)).maybe >>
295
+ optional_suffix.repeat(0, 2)
296
+ ).as(:combined_addenda) |
297
+ # Format 5: ASHRAE Addenda a, b, c to 105-2007 (missing type keyword)
298
+ (
299
+ publisher.as(:publisher) >> space >>
300
+ str("Addenda") >> space >>
301
+ addendum_code >>
302
+ (
303
+ (comma >> space >> str("and") >> space >> addendum_code) | # ", and b"
304
+ (space >> str("and") >> space >> addendum_code) | # "and b"
305
+ (comma >> space >> addendum_code).repeat(1, 20) | # comma-separated
306
+ (comma >> addendum_code).repeat(1, 20) # comma without space
307
+ ).repeat(0, 50).as(:additional_codes) >> # Allow 0 for single addendum
308
+ space >>
309
+ (str("to") | str("for")) >> space >>
310
+ code_with_year >>
311
+ optional_suffix.repeat(0, 2)
312
+ ).as(:combined_addenda) |
313
+ # Format 6: Addenda a, b, c to 105-2007 (without publisher, missing type)
314
+ (
315
+ str("Addenda") >> space >>
316
+ addendum_code >>
317
+ (
318
+ (comma >> space >> str("and") >> space >> addendum_code) | # ", and b"
319
+ (space >> str("and") >> space >> addendum_code) | # "and b"
320
+ (comma >> space >> addendum_code).repeat(1, 20) | # comma-separated
321
+ (comma >> addendum_code).repeat(1, 20) # comma without space
322
+ ).repeat(0, 50).as(:additional_codes) >> # Allow 0 for single addendum
323
+ space >>
324
+ (str("to") | str("for")) >> space >>
325
+ code_with_year >>
326
+ optional_suffix.repeat(0, 2)
327
+ ).as(:combined_addenda) |
328
+ # Format 7: ASHRAE Standard X-YYYY: Addenda a, b, c (colon or space separator)
329
+ (
330
+ publisher.as(:publisher) >> space >>
331
+ type.as(:type) >> space >>
332
+ code >>
333
+ (dash >> year_digits.as(:year)).maybe >>
334
+ ((colon >> space) | space) >>
335
+ str("Addenda") >> space >>
336
+ addendum_code >> # First addendum code
337
+ (
338
+ # Range pattern: "a through z"
339
+ (space >> str("through") >> space >> addendum_code) |
340
+ # Space or comma separated codes (handles typos like "bl bq")
341
+ ((space | (comma >> space)) >> addendum_code).repeat(1, 50) |
342
+ # Just match all comma-separated values
343
+ (comma >> space >> addendum_code).repeat(1, 50) |
344
+ # Or comma without space
345
+ (comma >> addendum_code).repeat(1, 50)
346
+ ).as(:additional_codes).maybe >>
347
+ (space >> additional_copublisher).maybe >>
348
+ addendum_date_suffix.maybe >>
349
+ optional_suffix.repeat(0, 2)
350
+ ).as(:combined_addenda)
351
+ end
352
+
353
+ # Year-first Addenda Package pattern
354
+ rule(:year_first_addenda_package_identifier) do
355
+ (
356
+ year_digits.as(:package_year) >> space >>
357
+ (
358
+ # Format 1: "YYYY Addenda Supplement Package to Standard X-YYYY"
359
+ (str("Addenda") >> space >> str("Supplement") >> (space >> str("Package")).maybe >> space >> str("to") >> space >>
360
+ ((str("ANSI") >> slash >> str("ASHRAE") >> (slash >> letter.repeat(3, 10)).repeat(
361
+ 0, 10
362
+ )).as(:copublisher) >> space).maybe >>
363
+ type.as(:type) >> space >> code >> (dash >> year_digits.as(:year)).maybe) |
364
+ # Format 2: "YYYY Supplement Addenda a, b, c to Standard X-YYYY"
365
+ (str("Supplement") >> space >> str("Addenda") >> space >>
366
+ addendum_code >>
367
+ (
368
+ (comma >> space >> addendum_code).repeat(1, 50) |
369
+ (comma >> addendum_code).repeat(1, 50)
370
+ ).as(:additional_codes).maybe >>
371
+ space >> str("to") >> space >>
372
+ ((str("ANSI") >> slash >> str("ASHRAE") >> (slash >> letter.repeat(3, 10)).repeat(
373
+ 0, 10
374
+ )).as(:copublisher) >> space).maybe >>
375
+ type.as(:type) >> space >> code >> (dash >> year_digits.as(:year)).maybe
376
+ ) |
377
+ # Format 3: "YYYY Addenda Supplement to Standard X-YYYY" (without "Package")
378
+ (str("Addenda") >> space >> str("Supplement") >> space >> str("to") >> space >>
379
+ ((str("ANSI") >> slash >> str("ASHRAE") >> (slash >> letter.repeat(3, 10)).repeat(
380
+ 0, 10
381
+ )).as(:copublisher) >> space).maybe >>
382
+ type.as(:type) >> space >> code >> (dash >> year_digits.as(:year)).maybe) |
383
+ # Format 4: "YYYY Supplement to ANSI/ASHRAE/... Standard X-YYYY Errata (date)"
384
+ (str("Supplement") >> space >> str("to") >> space >>
385
+ ((str("ANSI") >> slash >> str("ASHRAE") >> (slash >> letter.repeat(3, 10)).repeat(
386
+ 0, 10
387
+ )).as(:copublisher) >> space).maybe >>
388
+ type.as(:type) >> space >> code >> (dash >> year_digits.as(:year)).maybe >>
389
+ errata_suffix_on_addendum.maybe)
390
+ ) >>
391
+ optional_suffix.repeat(0, 2)
392
+ ).as(:addenda_package)
393
+ end
394
+
395
+ # Addenda Package pattern (collection packages)
396
+ rule(:addenda_package_identifier) do
397
+ # Format with copublisher: ANSI/ASHRAE Standard 34-2013 Addenda Supplement Package (...)
398
+ (
399
+ (str("ANSI") >> slash >> str("ASHRAE") >> (slash >> letter.repeat(3, 10)).repeat(
400
+ 0, 10
401
+ )).as(:copublisher) >> space >>
402
+ type.as(:type) >> space >>
403
+ code >>
404
+ (dash >> year_digits.as(:year)).maybe >>
405
+ ((colon >> space) | space) >>
406
+ str("Addenda") >> space >>
407
+ ((str("Supplement") >> (space >> str("Package")).maybe) | str("Package")).as(:package_description) >>
408
+ (space >> str("for") >> space >> year_digits.as(:target_year)).maybe >>
409
+ optional_suffix.repeat(0, 3)
410
+ ).as(:addenda_package) |
411
+ # Format with publisher + comma Addenda YEAR Supplement: ASHRAE Standard 90.1-2010, Addenda 2012 Supplement: Addenda Supplement Package
412
+ (
413
+ publisher.as(:publisher) >> space >>
414
+ type.as(:type) >> space >>
415
+ code >>
416
+ (dash >> year_digits.as(:year)).maybe >>
417
+ comma >> space >> str("Addenda") >> space >> year_digits.as(:package_year) >> space >> str("Supplement") >> colon >> space >>
418
+ str("Addenda") >> space >>
419
+ ((str("Supplement") >> (space >> str("Package")).maybe) | str("Package")).as(:package_description) >>
420
+ optional_suffix.repeat(0, 3)
421
+ ).as(:addenda_package) |
422
+ # Standard format with publisher: ASHRAE Standard X-YYYY Addenda Supplement Package
423
+ (
424
+ publisher.as(:publisher) >> space >>
425
+ type.as(:type) >> space >>
426
+ code >>
427
+ (dash >> year_digits.as(:year)).maybe >>
428
+ (space >> year_digits.as(:package_year)).maybe >>
429
+ additional_copublisher.maybe >>
430
+ suffix.maybe >>
431
+ reaffirmed.maybe >>
432
+ ((colon >> space) | space) >>
433
+ str("Addenda") >> space >>
434
+ ((str("Supplement") >> (space >> str("Package")).maybe) | str("Package")).as(:package_description) >>
435
+ (space >> str("for") >> space >> year_digits.as(:target_year)).maybe >>
436
+ optional_suffix.repeat(0, 3)
437
+ ).as(:addenda_package)
438
+ end
439
+
440
+ # Addendum date pattern (Month Day, Year - e.g., "January 22, 2019")
441
+ rule(:addendum_date_suffix) do
442
+ space >> lparen >> month_name >> space >> digit.repeat(1,
443
+ 2) >> comma.maybe >> (space | comma.maybe) >> year_digits >> rparen
444
+ end
445
+
446
+ # Addendum pattern (multiple formats):
447
+ rule(:addendum_identifier) do
448
+ # Format: ASHRAE Addendum X to Standard/Guideline X-YYYY
449
+ (
450
+ publisher.as(:publisher) >> space >>
451
+ str("Addendum") >> space >>
452
+ addendum_code >>
453
+ space >>
454
+ (str("to") | str("for")) >> space >>
455
+ type.as(:type) >> space >>
456
+ code >>
457
+ (dash >> year_digits.as(:year)).maybe >>
458
+ additional_copublisher.maybe >>
459
+ addendum_date_suffix.maybe >>
460
+ errata_suffix_on_addendum.maybe >>
461
+ optional_suffix.repeat(0, 2)
462
+ ).as(:publisher_addendum) |
463
+ # Format: ASHRAE Addendum X to ASHRAE Standard/Guideline X-YYYY (same publisher repeated)
464
+ (
465
+ publisher.as(:publisher) >> space >>
466
+ str("Addendum") >> space >>
467
+ addendum_code >>
468
+ space >>
469
+ (str("to") | str("for")) >> space >>
470
+ publisher.as(:base_publisher) >> space >>
471
+ type.as(:type) >> space >>
472
+ code >>
473
+ (dash >> year_digits.as(:year)).maybe >>
474
+ additional_copublisher.maybe >>
475
+ addendum_date_suffix.maybe >>
476
+ errata_suffix_on_addendum.maybe >>
477
+ optional_suffix.repeat(0, 2)
478
+ ).as(:publisher_base_addendum) |
479
+ # Format: ASHRAE Addendum X to ANSI/ASHRAE Standard/Guideline X-YYYY (ASHRAE publisher + copublisher base)
480
+ (
481
+ publisher.as(:publisher) >> space >>
482
+ str("Addendum") >> space >>
483
+ addendum_code >>
484
+ space >>
485
+ (str("to") | str("for")) >> space >>
486
+ (
487
+ (str("ANSI") >> slash >> str("ASHRAE") >> (slash >> letter.repeat(3, 10)).repeat(
488
+ 0, 10
489
+ )).as(:copublisher) >>
490
+ space
491
+ ) >>
492
+ type.as(:type) >> space >>
493
+ code >>
494
+ (dash >> year_digits.as(:year)).maybe >>
495
+ addendum_date_suffix.maybe >>
496
+ errata_suffix_on_addendum.maybe >>
497
+ optional_suffix.repeat(0, 2)
498
+ ).as(:publisher_addendum_copublisher) |
499
+ # Format: ASHRAE Addendum X to ANSI/ASHRAE 62.1-2022 (publisher + copublisher, no type)
500
+ (
501
+ publisher.as(:publisher) >> space >>
502
+ str("Addendum") >> space >>
503
+ addendum_code >>
504
+ space >>
505
+ (str("to") | str("for")) >> space >>
506
+ (
507
+ (str("ANSI") >> slash >> str("ASHRAE") >> (slash >> letter.repeat(3, 10)).repeat(
508
+ 0, 10
509
+ )).as(:copublisher) >>
510
+ space
511
+ ) >>
512
+ code_with_year >>
513
+ additional_copublisher.maybe >>
514
+ addendum_date_suffix.maybe >>
515
+ errata_suffix_on_addendum.maybe >>
516
+ optional_suffix.repeat(0, 2)
517
+ ).as(:publisher_addendum_copublisher_no_type) |
518
+ # Format: [ANSI/ASHRAE] Addendum X to/for [ANSI/ASHRAE] 34-2024 (no type)
519
+ (
520
+ (
521
+ (str("ANSI") >> slash >> str("ASHRAE") >> (slash >> letter.repeat(3, 10)).repeat(
522
+ 0, 10
523
+ )).as(:copublisher) >>
524
+ space
525
+ ).maybe >>
526
+ str("Addendum") >> space >>
527
+ addendum_code >>
528
+ space >>
529
+ (str("to") | str("for")) >> space >>
530
+ (
531
+ (str("ANSI") >> slash >> str("ASHRAE") >> (slash >> letter.repeat(3, 10)).repeat(
532
+ 0, 10
533
+ )).as(:copublisher) >>
534
+ space
535
+ ).maybe >> # Make second copublisher optional
536
+ code_with_year >>
537
+ additional_copublisher.maybe >>
538
+ addendum_date_suffix.maybe >>
539
+ errata_suffix_on_addendum.maybe >>
540
+ optional_suffix.repeat(0, 2)
541
+ ).as(:addendum_no_type) |
542
+ # Format: [ANSI/ASHRAE] Addendum X to/for [ANSI/ASHRAE] Standard/Guideline X-YYYY
543
+ (
544
+ (
545
+ (str("ANSI") >> slash >> str("ASHRAE") >> (slash >> letter.repeat(3, 10)).repeat(
546
+ 0, 10
547
+ )).as(:copublisher) >>
548
+ space
549
+ ).maybe >>
550
+ str("Addendum") >> space >>
551
+ addendum_code >>
552
+ space >>
553
+ (str("to") | str("for")) >> space >>
554
+ (
555
+ (str("ANSI") >> slash >> str("ASHRAE") >> (slash >> letter.repeat(3, 10)).repeat(
556
+ 0, 10
557
+ )).as(:copublisher) >>
558
+ space
559
+ ).maybe >>
560
+ type.as(:type) >> space >>
561
+ code >>
562
+ (dash >> year_digits.as(:year)).maybe >>
563
+ additional_copublisher.maybe >>
564
+ addendum_date_suffix.maybe >>
565
+ errata_suffix_on_addendum.maybe >>
566
+ optional_suffix.repeat(0, 2)
567
+ ).as(:addendum) |
568
+ # Format: ASHRAE Standard 15-2013 Addendum a
569
+ (
570
+ publisher.as(:publisher) >> space >>
571
+ type.as(:type) >> space >>
572
+ code >>
573
+ (dash >> year_digits.as(:year)).maybe >>
574
+ additional_copublisher.maybe >>
575
+ suffix.maybe >>
576
+ reaffirmed.maybe >>
577
+ ((colon >> space) | space) >>
578
+ (str("Addendum") | str("addendum")) >> space >>
579
+ addendum_code >>
580
+ addendum_date_suffix.maybe >>
581
+ errata_suffix_on_addendum.maybe >>
582
+ optional_suffix.repeat(0, 2)
583
+ ).as(:standard_addendum) |
584
+ # Format: ASHRAE Standard 15-2013 Addendum a (with lowercase and space only)
585
+ (
586
+ publisher.as(:publisher) >> space >>
587
+ type.as(:type) >> space >>
588
+ code >>
589
+ (dash >> year_digits.as(:year)).maybe >>
590
+ additional_copublisher.maybe >>
591
+ suffix.maybe >>
592
+ reaffirmed.maybe >>
593
+ space >>
594
+ (str("Addendum") | str("addendum")) >> space >>
595
+ addendum_code >>
596
+ addendum_date_suffix.maybe >>
597
+ errata_suffix_on_addendum.maybe >>
598
+ optional_suffix.repeat(0, 2)
599
+ ).as(:standard_addendum)
600
+ end
601
+
602
+ # Main identifier pattern
603
+ rule(:identifier) do
604
+ errata_identifier |
605
+ interpretation_identifier |
606
+ combined_addenda_identifier |
607
+ year_first_addenda_package_identifier |
608
+ addenda_package_identifier |
609
+ addendum_identifier |
610
+ # Standalone copublisher pattern (ANSI/AMCA 210-99, AMCA 210-99)
611
+ (((str("ANSI") >> slash).maybe >> letter.repeat(2,
612
+ 10)).as(:copublisher) >>
613
+ space >>
614
+ code_with_year >>
615
+ optional_suffix.repeat(0, 2)) |
616
+ # Copublished patterns without type (ANSI/ASHRAE 34-2024)
617
+ ((str("ANSI") >> slash >> str("ASHRAE") >> (slash >> letter.repeat(3, 10)).repeat(
618
+ 0, 10
619
+ )).as(:copublisher) >>
620
+ space >>
621
+ code_with_year >>
622
+ (space >> additional_copublisher).maybe >>
623
+ suffix.maybe >>
624
+ reaffirmed.maybe >>
625
+ optional_suffix.repeat(0, 2)) |
626
+ # Copublished patterns with type (ANSI/ASHRAE, ANSI/ASHRAE/ACCA, ANSI/ASHRAE/ASHE/ICC, etc.)
627
+ ((str("ANSI") >> slash >> str("ASHRAE") >> (slash >> letter.repeat(3, 10)).repeat(
628
+ 0, 10
629
+ )).as(:copublisher) >>
630
+ space >>
631
+ type.as(:type).maybe >> space.maybe >>
632
+ code >>
633
+ (space?.maybe >> dash >> year_digits.as(:year)).maybe >>
634
+ (space >> additional_copublisher).maybe >>
635
+ suffix.maybe >>
636
+ reaffirmed.maybe >>
637
+ optional_suffix.repeat(0, 2)) |
638
+ # Standard ASHRAE pattern
639
+ (publisher.as(:publisher) >> space >>
640
+ type.as(:type) >> space >>
641
+ code >>
642
+ (space?.maybe >> dash >> year_digits.as(:year)).maybe >>
643
+ (space >> additional_copublisher).maybe >>
644
+ suffix.maybe >>
645
+ reaffirmed.maybe >>
646
+ optional_suffix.repeat(0, 2)
647
+ ).as(:base)
648
+ end
649
+
650
+ root(:identifier)
651
+
652
+ def self.parse(string)
653
+ # Strip leading/trailing whitespace
654
+ cleaned = string.strip
655
+
656
+ # Handle fixture format: !original!canonical
657
+ # Extract just the original identifier for parsing
658
+ if cleaned.start_with?("!")
659
+ parts = cleaned.split("!")
660
+ # Format: "" (before first !) + "original" + "canonical"
661
+ cleaned = parts[1] if parts.size >= 3
662
+ end
663
+
664
+ # Normalize multiple spaces to single space
665
+ cleaned = cleaned.gsub(/\s+/, " ")
666
+
667
+ # Normalize reaffirmation patterns
668
+ cleaned = cleaned.gsub(/\(RA\s+(\d{4})\)/, "(RA \\1)")
669
+ cleaned = cleaned.gsub(/RA\s+(\d{4})/, "RA \\1")
670
+
671
+ # Remove trailing periods and commas
672
+ cleaned = cleaned.gsub(/[,.]$/, "")
673
+
674
+ # Remove trailing double parentheses (typos in source data)
675
+ cleaned = cleaned.gsub("))", ")")
676
+
677
+ # Fix unclosed trailing parenthesis (data truncation issue)
678
+ open_count = cleaned.count("(")
679
+ close_count = cleaned.count(")")
680
+ if open_count > close_count
681
+ cleaned += ")" * (open_count - close_count)
682
+ end
683
+
684
+ # Normalize dash patterns (remove space around dash in year/code)
685
+ cleaned = cleaned.gsub(/-\s+/, "-")
686
+ cleaned = cleaned.gsub(/\s+/, " ") # Clean up any double spaces created
687
+
688
+ # Preprocess ", and" and " and" patterns in addenda code lists
689
+ # This fixes greedy matching where "and" gets consumed as a code
690
+ # Only replace "and" in code lists (between Addendum/Addenda and to/for/(end)
691
+ # NOT in descriptive text that follows
692
+ if cleaned =~ /\bAddenda\s+/ || cleaned =~ /\bAddendum\s+/
693
+ # Find the boundary where code list ends (to, for, or opening paren)
694
+ boundary_pattern = /\s+(?:to|for|\()/
695
+ boundary_match = cleaned.match(boundary_pattern)
696
+
697
+ if boundary_match
698
+ # Only replace "and" in the portion before the boundary
699
+ boundary_pos = cleaned.index(boundary_match[0])
700
+ before_boundary = cleaned[0...boundary_pos]
701
+ after_boundary = cleaned[boundary_pos..]
702
+
703
+ # Replace ", and" and " and" in the code list portion only
704
+ before_boundary = before_boundary.gsub(/,\s+and\s+/i, ", ")
705
+ before_boundary = before_boundary.gsub(/\s+and\s+/i, ", ")
706
+
707
+ cleaned = before_boundary + after_boundary
708
+ else
709
+ # No boundary found, apply to entire string
710
+ cleaned = cleaned.gsub(/,\s+and\s+/i, ", ")
711
+ cleaned = cleaned.gsub(/\s+and\s+/i, ", ")
712
+ end
713
+
714
+ # Normalize "Addendum" to "Addenda" when followed by multiple codes (comma-separated)
715
+ # Pattern: "Addendum a, b" -> "Addenda a, b"
716
+ cleaned = cleaned.gsub(/\bAddendum\s+([a-z]+)\s*,\s*/i,
717
+ "Addenda \\1, ")
718
+ end
719
+
720
+ new.parse(cleaned)
721
+ end
722
+ end
723
+ end
724
+ end