@tricoteuses/assemblee 1.0.0-next.2 → 1.0.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +2 -0
- package/lib/api.js +23 -7
- package/lib/api.mjs +41 -0
- package/lib/bugs/acteur-00010/plugin.test.js +139 -33
- package/lib/bugs/acteur-00010/plugin.test.mjs +33 -0
- package/lib/bugs/acteur-00010.js +166 -24
- package/lib/bugs/acteur-00010.mjs +31 -0
- package/lib/bugs/agenda-00002/plugin.test.js +178 -52
- package/lib/bugs/agenda-00002/plugin.test.mjs +52 -0
- package/lib/bugs/agenda-00002.js +507 -143
- package/lib/bugs/agenda-00002.mjs +197 -0
- package/lib/bugs/agenda-00008/plugin.test.js +143 -31
- package/lib/bugs/agenda-00008/plugin.test.mjs +31 -0
- package/lib/bugs/agenda-00008.js +180 -25
- package/lib/bugs/agenda-00008.mjs +30 -0
- package/lib/bugs/agenda-00011/plugin.test.js +371 -156
- package/lib/bugs/agenda-00011/plugin.test.mjs +156 -0
- package/lib/bugs/agenda-00011.js +416 -117
- package/lib/bugs/agenda-00011.mjs +150 -0
- package/lib/bugs.js +591 -54
- package/lib/bugs.mjs +93 -0
- package/lib/cleaners/actes_legislatifs.js +149 -61
- package/lib/cleaners/actes_legislatifs.mjs +311 -0
- package/lib/cleaners/acteurs.js +255 -123
- package/lib/cleaners/acteurs.mjs +211 -0
- package/lib/cleaners/amendements.js +242 -117
- package/lib/cleaners/amendements.mjs +292 -0
- package/lib/cleaners/documents.js +147 -62
- package/lib/cleaners/documents.mjs +162 -0
- package/lib/cleaners/dossiers_legislatifs.js +132 -45
- package/lib/cleaners/dossiers_legislatifs.mjs +123 -0
- package/lib/cleaners/index.js +64 -8
- package/lib/cleaners/index.mjs +8 -0
- package/lib/cleaners/organes.js +54 -21
- package/lib/cleaners/organes.mjs +64 -0
- package/lib/cleaners/reunions.js +237 -127
- package/lib/cleaners/reunions.mjs +318 -0
- package/lib/cleaners/scrutins.js +261 -99
- package/lib/cleaners/scrutins.mjs +254 -0
- package/lib/cleaners/xml.js +81 -16
- package/lib/cleaners/xml.mjs +42 -0
- package/lib/datasets.js +284 -153
- package/lib/datasets.mjs +596 -0
- package/lib/dates.js +93 -34
- package/lib/dates.mjs +98 -0
- package/lib/dossiers_legislatifs.js +107 -33
- package/lib/dossiers_legislatifs.mjs +215 -0
- package/lib/file_systems.js +203 -35
- package/lib/file_systems.mjs +64 -0
- package/lib/git.js +139 -41
- package/lib/git.mjs +114 -0
- package/lib/index.js +310 -16
- package/lib/index.mjs +16 -0
- package/lib/inserters.js +355 -131
- package/lib/inserters.mjs +413 -0
- package/lib/loaders.js +900 -440
- package/lib/loaders.mjs +678 -0
- package/lib/organes.js +15 -5
- package/lib/organes.mjs +18 -0
- package/lib/parsers/documents.js +241 -89
- package/lib/parsers/documents.mjs +433 -0
- package/lib/parsers/index.js +36 -3
- package/lib/parsers/index.mjs +3 -0
- package/lib/parsers/recherche_amendements.js +616 -173
- package/lib/parsers/recherche_amendements.mjs +189 -0
- package/lib/raw_types/acteurs_et_organes.d.ts +36 -148
- package/lib/raw_types/acteurs_et_organes.js +228 -506
- package/lib/raw_types/acteurs_et_organes.mjs +1240 -0
- package/lib/raw_types/agendas.js +165 -75
- package/lib/raw_types/agendas.mjs +944 -0
- package/lib/raw_types/amendements.js +165 -77
- package/lib/raw_types/amendements.mjs +1040 -0
- package/lib/raw_types/dossiers_legislatifs.d.ts +1 -43
- package/lib/raw_types/dossiers_legislatifs.js +181 -143
- package/lib/raw_types/dossiers_legislatifs.mjs +1792 -0
- package/lib/raw_types/scrutins.js +144 -61
- package/lib/raw_types/scrutins.mjs +645 -0
- package/lib/scripts/bugs_helper.js +657 -155
- package/lib/scripts/bugs_helper.mjs +286 -0
- package/lib/scripts/clean_data.js +380 -145
- package/lib/scripts/clean_data.mjs +190 -0
- package/lib/scripts/clean_reorganized_data.js +627 -331
- package/lib/scripts/clean_reorganized_data.mjs +520 -0
- package/lib/scripts/diff_amendements.js +159 -73
- package/lib/scripts/diff_amendements.mjs +234 -0
- package/lib/scripts/document_dossiers_legislatifs.js +570 -288
- package/lib/scripts/document_dossiers_legislatifs.mjs +494 -0
- package/lib/scripts/get_today_reunions.js +37 -20
- package/lib/scripts/get_today_reunions.mjs +41 -0
- package/lib/scripts/merge_scrutins.js +121 -39
- package/lib/scripts/merge_scrutins.mjs +69 -0
- package/lib/scripts/parse_textes_lois.js +179 -125
- package/lib/scripts/parse_textes_lois.mjs +215 -0
- package/lib/scripts/raw_types_from_amendements.js +276 -77
- package/lib/scripts/raw_types_from_amendements.mjs +118 -0
- package/lib/scripts/reorganize_data.js +867 -446
- package/lib/scripts/reorganize_data.mjs +712 -0
- package/lib/scripts/retrieve_deputes_photos.js +378 -157
- package/lib/scripts/retrieve_deputes_photos.mjs +230 -0
- package/lib/scripts/retrieve_documents.js +648 -172
- package/lib/scripts/retrieve_documents.mjs +292 -0
- package/lib/scripts/retrieve_open_data.js +286 -85
- package/lib/scripts/retrieve_open_data.mjs +125 -0
- package/lib/scripts/retrieve_pending_amendments.js +302 -69
- package/lib/scripts/retrieve_pending_amendments.mjs +130 -0
- package/lib/scripts/retrieve_senateurs_photos.js +374 -198
- package/lib/scripts/retrieve_senateurs_photos.mjs +277 -0
- package/lib/scripts/retrieve_textes_lois.js +343 -89
- package/lib/scripts/retrieve_textes_lois.mjs +168 -0
- package/lib/scripts/test_load.js +30 -11
- package/lib/scripts/test_load.mjs +26 -0
- package/lib/scripts/test_load_big_files.js +30 -11
- package/lib/scripts/test_load_big_files.mjs +26 -0
- package/lib/scripts/validate_json.js +370 -120
- package/lib/scripts/validate_json.mjs +216 -0
- package/lib/shared_types/codes_actes.js +50 -15
- package/lib/shared_types/codes_actes.mjs +228 -0
- package/lib/strings.js +16 -3
- package/lib/strings.mjs +7 -0
- package/lib/types/acteurs_et_organes.js +156 -71
- package/lib/types/acteurs_et_organes.mjs +918 -0
- package/lib/types/agendas.js +154 -67
- package/lib/types/agendas.mjs +623 -0
- package/lib/types/amendements.js +166 -77
- package/lib/types/amendements.mjs +885 -0
- package/lib/types/dossiers_legislatifs.d.ts +1 -42
- package/lib/types/dossiers_legislatifs.js +182 -143
- package/lib/types/dossiers_legislatifs.mjs +1120 -0
- package/lib/types/legislatures.js +12 -3
- package/lib/types/legislatures.mjs +9 -0
- package/lib/types/scrutins.js +144 -61
- package/lib/types/scrutins.mjs +528 -0
- package/lib/urls.js +44 -25
- package/lib/urls.mjs +201 -0
- package/package.json +33 -12
|
@@ -0,0 +1,433 @@
|
|
|
1
|
+
import assert from "assert";
|
|
2
|
+
import { JSDOM } from "jsdom";
|
|
3
|
+
export function parseTexteLoi(assembleeUrl, page) {
|
|
4
|
+
// Repair HTML.
|
|
5
|
+
const pageSegments = page.split("</style>");
|
|
6
|
+
assert.strictEqual(pageSegments.length, 2, page);
|
|
7
|
+
let html = pageSegments[1].trim();
|
|
8
|
+
assert(html.startsWith("<div"));
|
|
9
|
+
assert(html.endsWith("</div>"));
|
|
10
|
+
html = `<html${html.substring(4, html.length - 6)}</html>`; // Extract subdivisions from HTML.
|
|
11
|
+
|
|
12
|
+
const {
|
|
13
|
+
window
|
|
14
|
+
} = new JSDOM(html);
|
|
15
|
+
const {
|
|
16
|
+
document
|
|
17
|
+
} = window;
|
|
18
|
+
assert.strictEqual(document.children.length, 1);
|
|
19
|
+
const htmlElement = document.children[0];
|
|
20
|
+
assert.strictEqual(htmlElement.children.length, 2);
|
|
21
|
+
const bodyElement = htmlElement.children[1];
|
|
22
|
+
|
|
23
|
+
if (assembleeUrl === "http://www.assemblee-nationale.fr/15/textes/0675.asp") {
|
|
24
|
+
// Repair document.
|
|
25
|
+
assert.strictEqual(bodyElement.children.length, 1);
|
|
26
|
+
const divElement = bodyElement.children[0];
|
|
27
|
+
assert.strictEqual(divElement.tagName, "DIV");
|
|
28
|
+
const newDivElement = bodyElement.insertBefore(document.createElement("div"), divElement);
|
|
29
|
+
bodyElement.insertBefore(document.createElement("br"), divElement);
|
|
30
|
+
|
|
31
|
+
for (const divChild of [...divElement.children]) {
|
|
32
|
+
if (divChild.getAttribute("class") === "a9ArticleNum") {
|
|
33
|
+
break;
|
|
34
|
+
}
|
|
35
|
+
|
|
36
|
+
newDivElement.appendChild(divChild);
|
|
37
|
+
}
|
|
38
|
+
}
|
|
39
|
+
|
|
40
|
+
if (bodyElement.children.length < 3) {
|
|
41
|
+
// Occurs in http://www.assemblee-nationale.fr/15/textes/0326.asp.
|
|
42
|
+
window.close(); // Free memory.
|
|
43
|
+
|
|
44
|
+
return {
|
|
45
|
+
error: {
|
|
46
|
+
code: -1,
|
|
47
|
+
message: "Texte de loi sans contenu"
|
|
48
|
+
},
|
|
49
|
+
html,
|
|
50
|
+
page
|
|
51
|
+
};
|
|
52
|
+
}
|
|
53
|
+
|
|
54
|
+
assert.strictEqual(bodyElement.children[0].tagName, "DIV"); // First child is a DIV describing the document (Assemblée's header). Skip it for now.
|
|
55
|
+
|
|
56
|
+
let bodyChild = bodyElement.children[1];
|
|
57
|
+
assert.strictEqual(bodyChild.tagName, "BR");
|
|
58
|
+
let alineaElement = null;
|
|
59
|
+
let isMultiLinesHeader = false;
|
|
60
|
+
let level = null;
|
|
61
|
+
let levels = [];
|
|
62
|
+
let lineElements = null;
|
|
63
|
+
let nextParentState = null;
|
|
64
|
+
let paragraphChild = null;
|
|
65
|
+
let paragraphElement = null;
|
|
66
|
+
let state = "nextBodyChild";
|
|
67
|
+
let subAlineaElement = null;
|
|
68
|
+
const subdivisions = [];
|
|
69
|
+
let subdivisionAlineasHtml = null;
|
|
70
|
+
let subdivisionAlineasText = null;
|
|
71
|
+
let subdivisionHeadersHtml = null;
|
|
72
|
+
let subdivisionHeadersText = null;
|
|
73
|
+
|
|
74
|
+
while (state !== null) {
|
|
75
|
+
switch (state) {
|
|
76
|
+
case "alineaElement":
|
|
77
|
+
switch (alineaElement.tagName) {
|
|
78
|
+
case "DIV":
|
|
79
|
+
state = "firstSubAlineaElement";
|
|
80
|
+
break;
|
|
81
|
+
|
|
82
|
+
case "H4":
|
|
83
|
+
// TODO
|
|
84
|
+
nextParentState = "nextAlineaElement";
|
|
85
|
+
paragraphElement = alineaElement;
|
|
86
|
+
state = "firstParagraphChild";
|
|
87
|
+
break;
|
|
88
|
+
|
|
89
|
+
case "P":
|
|
90
|
+
nextParentState = "nextAlineaElement";
|
|
91
|
+
paragraphElement = alineaElement;
|
|
92
|
+
state = "firstParagraphChild";
|
|
93
|
+
break;
|
|
94
|
+
|
|
95
|
+
case "OL":
|
|
96
|
+
// TODO
|
|
97
|
+
state = "nextAlineaElement";
|
|
98
|
+
break;
|
|
99
|
+
|
|
100
|
+
case "TABLE":
|
|
101
|
+
// TODO
|
|
102
|
+
state = "nextAlineaElement";
|
|
103
|
+
break;
|
|
104
|
+
|
|
105
|
+
default:
|
|
106
|
+
return {
|
|
107
|
+
error: {
|
|
108
|
+
code: -2,
|
|
109
|
+
message: `Unexpected tag name for alinea element: ${alineaElement.tagName}`
|
|
110
|
+
},
|
|
111
|
+
html,
|
|
112
|
+
page
|
|
113
|
+
};
|
|
114
|
+
}
|
|
115
|
+
|
|
116
|
+
break;
|
|
117
|
+
|
|
118
|
+
case "firstAlineaElement":
|
|
119
|
+
alineaElement = bodyChild.children[0];
|
|
120
|
+
|
|
121
|
+
if (alineaElement === undefined) {
|
|
122
|
+
// No alinea in current bodyChild: go to next bodyChild.
|
|
123
|
+
state = "nextBodyChild";
|
|
124
|
+
} else {
|
|
125
|
+
state = "alineaElement";
|
|
126
|
+
}
|
|
127
|
+
|
|
128
|
+
break;
|
|
129
|
+
|
|
130
|
+
case "firstParagraphChild":
|
|
131
|
+
paragraphChild = paragraphElement.children[0];
|
|
132
|
+
|
|
133
|
+
if (paragraphChild === undefined) {
|
|
134
|
+
// No child in current paragraph: go to next parent element.
|
|
135
|
+
state = nextParentState;
|
|
136
|
+
} else {
|
|
137
|
+
const headerText = paragraphElement.textContent;
|
|
138
|
+
const nameComputed = (headerText || "").normalize("NFD").replace(/[\u0300-\u036f]/g, "").replace(/\(nouveau\)/, "").replace(/\(Pour coordination\)/, "").replace(/\(Supprimés?\)/, "").replace(/ /g, " ").replace(/[\-,.…]/g, "").trim().replace(/ {1,}/g, "_");
|
|
139
|
+
const nameUpper = nameComputed.toUpperCase();
|
|
140
|
+
|
|
141
|
+
if (nameUpper === "") {
|
|
142
|
+
// Occurs in:
|
|
143
|
+
// * http://www.assemblee-nationale.fr/15/textes/0445.asp
|
|
144
|
+
// * http://www.assemblee-nationale.fr/15/textes/0626.asp
|
|
145
|
+
// Skip paragraph.
|
|
146
|
+
state = nextParentState;
|
|
147
|
+
break;
|
|
148
|
+
}
|
|
149
|
+
|
|
150
|
+
const nextLevel = nameUpper.match(/^(RAPPORT_)?ANNEXE(_|$)/) !== null || nameUpper.match(/^ETAT_/) !== null ? 0 : nameUpper.match(/^TOME_/) !== null ? 1 : nameUpper.match(/^PARTIE_/) !== null || nameUpper.match(/^(PREMIERE|SECONDE|DEUXIEME|TROISIEME|QUATRIEME)_PARTIE(_|$)/) !== null ? 2 : nameUpper.match(/^LIVRE_/) !== null ? 3 : nameUpper.match(/^TITRE_/) !== null ? 4 : nameUpper.match(/^SOUSTITRE_/) !== null ? 5 : nameUpper.match(/^CHAPITRE_/) !== null ? 6 : nameUpper.match(/^SECTION_/) !== null ? 7 : nameUpper.match(/^SOUSSECTION_/) !== null ? 8 : nameUpper.match(/^ARTICLES?_/) !== null || // "Exposé des motifs" must be at the same level as article.
|
|
151
|
+
// "Exposé des motifs" without content:
|
|
152
|
+
// * http://www.assemblee-nationale.fr/15/textes/0702.asp
|
|
153
|
+
// "Exposé des motifs" with content:
|
|
154
|
+
// * http://www.assemblee-nationale.fr/15/textes/1326.asp
|
|
155
|
+
// * http://www.assemblee-nationale.fr/15/textes/1610.asp
|
|
156
|
+
nameUpper.match(/^EXPOSE_DES_MOTIFS$/) !== null ? 9 : null;
|
|
157
|
+
|
|
158
|
+
if (nextLevel === null && subdivisions.length === 0) {
|
|
159
|
+
if (nameUpper.match(/^(PROJET|PROPOSITION)_DE_LOI(_|$)/) !== null) {// Occurs in:
|
|
160
|
+
// * http://www.assemblee-nationale.fr/15/textes/0232.asp
|
|
161
|
+
// * http://www.assemblee-nationale.fr/15/textes/0626.asp
|
|
162
|
+
// * http://www.assemblee-nationale.fr/15/textes/0676.asp
|
|
163
|
+
} else if (nameUpper === "JEUX_OLYMPIQUES_ET_PARALYMPIQUES_DE_2024") {// Occurs in http://www.assemblee-nationale.fr/15/textes/0676.asp
|
|
164
|
+
} else if (nameUpper === "TEXTE_DE_LA_COMMISSION_MIXTE_PARITAIRE") {// Occurs in http://www.assemblee-nationale.fr/15/textes/1294.asp
|
|
165
|
+
} else {
|
|
166
|
+
console.log(`Unexpected nameUpper = "${nameUpper}" at beginning of "texte de loi" at ${assembleeUrl}`);
|
|
167
|
+
} // Skip paragraph.
|
|
168
|
+
|
|
169
|
+
|
|
170
|
+
state = nextParentState;
|
|
171
|
+
break;
|
|
172
|
+
}
|
|
173
|
+
|
|
174
|
+
if (nextLevel !== null) {
|
|
175
|
+
level = nextLevel;
|
|
176
|
+
|
|
177
|
+
while (levels.length > 0 && level < levels[levels.length - 1]) {
|
|
178
|
+
levels.pop();
|
|
179
|
+
}
|
|
180
|
+
|
|
181
|
+
if (levels.length === 0 || level > levels[levels.length - 1]) {
|
|
182
|
+
levels.push(level);
|
|
183
|
+
} // Articles & "Exposé des motifs" are the only divisions without second title.
|
|
184
|
+
|
|
185
|
+
|
|
186
|
+
isMultiLinesHeader = nameUpper.match(/^ARTICLES?_/) === null && nameUpper.match(/^EXPOSE_DES_MOTIFS$/) === null;
|
|
187
|
+
subdivisionAlineasHtml = [];
|
|
188
|
+
subdivisionAlineasText = [];
|
|
189
|
+
subdivisionHeadersHtml = [];
|
|
190
|
+
subdivisionHeadersText = [];
|
|
191
|
+
subdivisions.push({
|
|
192
|
+
html: {
|
|
193
|
+
alineas: subdivisionAlineasHtml,
|
|
194
|
+
headers: subdivisionHeadersHtml
|
|
195
|
+
},
|
|
196
|
+
id: "D_" + nameComputed,
|
|
197
|
+
level: level + 1,
|
|
198
|
+
relativeLevel: levels.length,
|
|
199
|
+
text: {
|
|
200
|
+
alineas: subdivisionAlineasText,
|
|
201
|
+
headers: subdivisionHeadersText
|
|
202
|
+
}
|
|
203
|
+
});
|
|
204
|
+
}
|
|
205
|
+
|
|
206
|
+
lineElements = [];
|
|
207
|
+
state = "paragraphChild";
|
|
208
|
+
}
|
|
209
|
+
|
|
210
|
+
break;
|
|
211
|
+
|
|
212
|
+
case "firstSubAlineaElement":
|
|
213
|
+
subAlineaElement = alineaElement.children[0];
|
|
214
|
+
|
|
215
|
+
if (subAlineaElement === undefined) {
|
|
216
|
+
// No sub-alinea in current alinea: go to next alinea.
|
|
217
|
+
state = "nextAlineaElement";
|
|
218
|
+
} else {
|
|
219
|
+
state = "subAlineaElement";
|
|
220
|
+
}
|
|
221
|
+
|
|
222
|
+
break;
|
|
223
|
+
|
|
224
|
+
case "nextAlineaElement":
|
|
225
|
+
alineaElement = alineaElement.nextElementSibling;
|
|
226
|
+
|
|
227
|
+
if (alineaElement === null) {
|
|
228
|
+
// The bodyChild has been fully parsed. Go to next bodyChild
|
|
229
|
+
state = "nextBodyChild";
|
|
230
|
+
} else {
|
|
231
|
+
state = "alineaElement";
|
|
232
|
+
}
|
|
233
|
+
|
|
234
|
+
break;
|
|
235
|
+
|
|
236
|
+
case "nextBodyChild":
|
|
237
|
+
if (bodyChild.nextElementSibling === null) {
|
|
238
|
+
// The document has been fully parsed.
|
|
239
|
+
state = null;
|
|
240
|
+
} else {
|
|
241
|
+
bodyChild = bodyChild.nextElementSibling;
|
|
242
|
+
|
|
243
|
+
if (bodyChild.tagName === "DIV") {
|
|
244
|
+
state = "firstAlineaElement";
|
|
245
|
+
} else {
|
|
246
|
+
// <P/> is for footnotes
|
|
247
|
+
assert(["BR", "HR", "P"].includes(bodyChild.tagName), `Unexpected tag name "${bodyChild.tagName}" for body child`); // Stay in the same state to go to next bodyChild.
|
|
248
|
+
}
|
|
249
|
+
}
|
|
250
|
+
|
|
251
|
+
break;
|
|
252
|
+
|
|
253
|
+
case "nextParagraphChild":
|
|
254
|
+
paragraphChild = paragraphChild.nextElementSibling;
|
|
255
|
+
|
|
256
|
+
if (paragraphChild === null) {
|
|
257
|
+
// The paragraph element has been fully parsed. Go to next parent element.
|
|
258
|
+
const lineText = lineElements.map(element => element.textContent).join("").trim();
|
|
259
|
+
|
|
260
|
+
if (lineText) {
|
|
261
|
+
const lineHtml = lineElements.map(element => element.outerHTML).join("");
|
|
262
|
+
|
|
263
|
+
if (subdivisionHeadersText.length === 0 || isMultiLinesHeader && subdivisionAlineasText.length === 0) {
|
|
264
|
+
subdivisionHeadersHtml.push(lineHtml);
|
|
265
|
+
subdivisionHeadersText.push(lineText);
|
|
266
|
+
} else {
|
|
267
|
+
subdivisionAlineasHtml.push(lineHtml);
|
|
268
|
+
subdivisionAlineasText.push(lineText);
|
|
269
|
+
}
|
|
270
|
+
}
|
|
271
|
+
|
|
272
|
+
if (isMultiLinesHeader && subdivisionHeadersText.length >= 2) {
|
|
273
|
+
isMultiLinesHeader = false;
|
|
274
|
+
}
|
|
275
|
+
|
|
276
|
+
lineElements = null;
|
|
277
|
+
state = nextParentState;
|
|
278
|
+
} else {
|
|
279
|
+
state = "paragraphChild";
|
|
280
|
+
}
|
|
281
|
+
|
|
282
|
+
break;
|
|
283
|
+
|
|
284
|
+
case "nextSubAlineaElement":
|
|
285
|
+
subAlineaElement = subAlineaElement.nextElementSibling;
|
|
286
|
+
|
|
287
|
+
if (subAlineaElement === null) {
|
|
288
|
+
// The alineaElement has been fully parsed. Go to next alineaElement.
|
|
289
|
+
state = "nextAlineaElement";
|
|
290
|
+
} else {
|
|
291
|
+
state = "subAlineaElement";
|
|
292
|
+
}
|
|
293
|
+
|
|
294
|
+
break;
|
|
295
|
+
|
|
296
|
+
case "paragraphChild":
|
|
297
|
+
switch (paragraphChild.tagName) {
|
|
298
|
+
case "A":
|
|
299
|
+
{
|
|
300
|
+
lineElements.push(paragraphChild);
|
|
301
|
+
break;
|
|
302
|
+
}
|
|
303
|
+
|
|
304
|
+
case "BR":
|
|
305
|
+
{
|
|
306
|
+
const lineText = lineElements.map(element => element.textContent).join("").trim();
|
|
307
|
+
|
|
308
|
+
if (lineText) {
|
|
309
|
+
const lineHtml = lineElements.map(element => element.outerHTML).join("");
|
|
310
|
+
|
|
311
|
+
if (subdivisionHeadersText.length === 0 || isMultiLinesHeader && subdivisionAlineasText.length === 0) {
|
|
312
|
+
subdivisionHeadersHtml.push(lineHtml);
|
|
313
|
+
subdivisionHeadersText.push(lineText);
|
|
314
|
+
} else {
|
|
315
|
+
subdivisionAlineasHtml.push(lineHtml);
|
|
316
|
+
subdivisionAlineasText.push(lineText);
|
|
317
|
+
}
|
|
318
|
+
}
|
|
319
|
+
|
|
320
|
+
lineElements = [];
|
|
321
|
+
break;
|
|
322
|
+
}
|
|
323
|
+
|
|
324
|
+
case "DEL":
|
|
325
|
+
{
|
|
326
|
+
lineElements.push(paragraphChild);
|
|
327
|
+
break;
|
|
328
|
+
}
|
|
329
|
+
|
|
330
|
+
case "IMG":
|
|
331
|
+
{
|
|
332
|
+
lineElements.push(paragraphChild);
|
|
333
|
+
break;
|
|
334
|
+
}
|
|
335
|
+
|
|
336
|
+
case "SPAN":
|
|
337
|
+
{
|
|
338
|
+
const className = paragraphChild.getAttribute("class");
|
|
339
|
+
|
|
340
|
+
switch (className) {
|
|
341
|
+
case "aEloiPastille":
|
|
342
|
+
{
|
|
343
|
+
// Skip pastillé SPAN.
|
|
344
|
+
break;
|
|
345
|
+
}
|
|
346
|
+
|
|
347
|
+
case "aEloiPastille0":
|
|
348
|
+
{
|
|
349
|
+
// Skip pastillé SPAN.
|
|
350
|
+
break;
|
|
351
|
+
}
|
|
352
|
+
|
|
353
|
+
default:
|
|
354
|
+
lineElements.push(paragraphChild);
|
|
355
|
+
}
|
|
356
|
+
|
|
357
|
+
break;
|
|
358
|
+
}
|
|
359
|
+
|
|
360
|
+
default:
|
|
361
|
+
return {
|
|
362
|
+
error: {
|
|
363
|
+
code: -3,
|
|
364
|
+
message: `Unexpected tag name for paragraph child: ${paragraphChild.tagName}`
|
|
365
|
+
},
|
|
366
|
+
html,
|
|
367
|
+
page
|
|
368
|
+
};
|
|
369
|
+
}
|
|
370
|
+
|
|
371
|
+
state = "nextParagraphChild";
|
|
372
|
+
break;
|
|
373
|
+
|
|
374
|
+
case "subAlineaElement":
|
|
375
|
+
switch (subAlineaElement.tagName) {
|
|
376
|
+
case "P":
|
|
377
|
+
nextParentState = "nextSubAlineaElement";
|
|
378
|
+
paragraphElement = subAlineaElement;
|
|
379
|
+
state = "firstParagraphChild";
|
|
380
|
+
break;
|
|
381
|
+
|
|
382
|
+
case "TABLE":
|
|
383
|
+
// TODO
|
|
384
|
+
state = "nextSubAlineaElement";
|
|
385
|
+
break;
|
|
386
|
+
|
|
387
|
+
default:
|
|
388
|
+
return {
|
|
389
|
+
error: {
|
|
390
|
+
code: -4,
|
|
391
|
+
message: `Unexpected tag name for sub alinea element: ${subAlineaElement.tagName}`
|
|
392
|
+
},
|
|
393
|
+
html,
|
|
394
|
+
page
|
|
395
|
+
};
|
|
396
|
+
}
|
|
397
|
+
|
|
398
|
+
break;
|
|
399
|
+
state = "nextSubAlineaElement";
|
|
400
|
+
break;
|
|
401
|
+
|
|
402
|
+
default:
|
|
403
|
+
throw `Unexpected state: ${state}`;
|
|
404
|
+
}
|
|
405
|
+
}
|
|
406
|
+
|
|
407
|
+
window.close(); // Free memory.
|
|
408
|
+
|
|
409
|
+
return {
|
|
410
|
+
error: null,
|
|
411
|
+
html,
|
|
412
|
+
page,
|
|
413
|
+
subdivisions,
|
|
414
|
+
url: assembleeUrl
|
|
415
|
+
};
|
|
416
|
+
}
|
|
417
|
+
export async function retrieveTexteLoiParsed(fetch, assembleeUrl) {
|
|
418
|
+
const response = await fetch(assembleeUrl);
|
|
419
|
+
const page = await response.text();
|
|
420
|
+
|
|
421
|
+
if (!response.ok) {
|
|
422
|
+
return {
|
|
423
|
+
error: {
|
|
424
|
+
code: response.status,
|
|
425
|
+
message: response.statusText
|
|
426
|
+
},
|
|
427
|
+
page
|
|
428
|
+
};
|
|
429
|
+
}
|
|
430
|
+
|
|
431
|
+
return parseTexteLoi(assembleeUrl, page);
|
|
432
|
+
}
|
|
433
|
+
//# sourceMappingURL=data:application/json;charset=utf-8;base64,{"version":3,"names":["assert","JSDOM","parseTexteLoi","assembleeUrl","page","pageSegments","split","strictEqual","length","html","trim","startsWith","endsWith","substring","window","document","children","htmlElement","bodyElement","divElement","tagName","newDivElement","insertBefore","createElement","divChild","getAttribute","appendChild","close","error","code","message","bodyChild","alineaElement","isMultiLinesHeader","level","levels","lineElements","nextParentState","paragraphChild","paragraphElement","state","subAlineaElement","subdivisions","subdivisionAlineasHtml","subdivisionAlineasText","subdivisionHeadersHtml","subdivisionHeadersText","undefined","headerText","textContent","nameComputed","normalize","replace","nameUpper","toUpperCase","nextLevel","match","console","log","pop","push","alineas","headers","id","relativeLevel","text","nextElementSibling","includes","lineText","map","element","join","lineHtml","outerHTML","className","url","retrieveTexteLoiParsed","fetch","response","ok","status","statusText"],"sources":["../../src/parsers/documents.ts"],"sourcesContent":["import assert from \"assert\"\nimport { JSDOM } from \"jsdom\"\n\nexport function parseTexteLoi(assembleeUrl: string, page: string) {\n  // Repair HTML.\n  const pageSegments = page.split(\"</style>\")\n  assert.strictEqual(pageSegments.length, 2, page)\n  let html = pageSegments[1].trim()\n  assert(html.startsWith(\"<div\"))\n  assert(html.endsWith(\"</div>\"))\n  html = `<html${html.substring(4, html.length - 6)}</html>`\n\n  // Extract subdivisions from HTML.\n  const { window } = new JSDOM(html)\n  const { document } = window\n  assert.strictEqual(document.children.length, 1)\n  const htmlElement = document.children[0]\n  assert.strictEqual(htmlElement.children.length, 2)\n  const bodyElement = htmlElement.children[1]\n  if (assembleeUrl === \"http://www.assemblee-nationale.fr/15/textes/0675.asp\") {\n    // Repair document.\n    assert.strictEqual(bodyElement.children.length, 1)\n    const divElement = bodyElement.children[0]\n    assert.strictEqual(divElement.tagName, \"DIV\")\n    const newDivElement = bodyElement.insertBefore(\n      document.createElement(\"div\"),\n      divElement,\n    )\n    bodyElement.insertBefore(document.createElement(\"br\"), divElement)\n    for (const divChild of [...divElement.children]) {\n      if (divChild.getAttribute(\"class\") === \"a9ArticleNum\") {\n        break\n      }\n      newDivElement.appendChild(divChild)\n    }\n  }\n  if (bodyElement.children.length < 3) {\n    // Occurs in http://www.assemblee-nationale.fr/15/textes/0326.asp.\n    window.close() // Free memory.\n    return {\n      error: { code: -1, message: \"Texte de loi sans contenu\" },\n      html,\n      page,\n    }\n  }\n  assert.strictEqual(bodyElement.children[0].tagName, \"DIV\")\n  // First child is a DIV describing the document (Assemblée's header). Skip it for now.\n  let bodyChild = bodyElement.children[1]\n  assert.strictEqual(bodyChild.tagName, \"BR\")\n  let alineaElement: Element | null = null\n  let isMultiLinesHeader: boolean = false\n  let level: number | null = null\n  let levels: number[] = []\n  let lineElements: Element[] | null = null\n  let nextParentState = null\n  let paragraphChild: Element | null = null\n  let paragraphElement: Element | null = null\n  let state: string | null = \"nextBodyChild\"\n  let subAlineaElement: Element | null = null\n  const subdivisions = []\n  let subdivisionAlineasHtml: string[] | null = null\n  let subdivisionAlineasText: string[] | null = null\n  let subdivisionHeadersHtml: string[] | null = null\n  let subdivisionHeadersText: string[] | null = null\n  while (state !== null) {\n    switch (state) {\n      case \"alineaElement\":\n        switch (alineaElement!.tagName) {\n          case \"DIV\":\n            state = \"firstSubAlineaElement\"\n            break\n          case \"H4\":\n            // TODO\n            nextParentState = \"nextAlineaElement\"\n            paragraphElement = alineaElement\n            state = \"firstParagraphChild\"\n            break\n          case \"P\":\n            nextParentState = \"nextAlineaElement\"\n            paragraphElement = alineaElement\n            state = \"firstParagraphChild\"\n            break\n          case \"OL\":\n            // TODO\n            state = \"nextAlineaElement\"\n            break\n          case \"TABLE\":\n            // TODO\n            state = \"nextAlineaElement\"\n            break\n          default:\n            return {\n              error: {\n                code: -2,\n                message: `Unexpected tag name for alinea element: ${\n                  alineaElement!.tagName\n                }`,\n              },\n              html,\n              page,\n            }\n        }\n        break\n      case \"firstAlineaElement\":\n        alineaElement = bodyChild.children[0]\n        if (alineaElement === undefined) {\n          // No alinea in current bodyChild: go to next bodyChild.\n          state = \"nextBodyChild\"\n        } else {\n          state = \"alineaElement\"\n        }\n        break\n      case \"firstParagraphChild\":\n        paragraphChild = paragraphElement!.children[0]\n        if (paragraphChild === undefined) {\n          // No child in current paragraph: go to next parent element.\n          state = nextParentState\n        } else {\n          const headerText = paragraphElement!.textContent\n          const nameComputed = (headerText || \"\")\n            .normalize(\"NFD\")\n            .replace(/[\\u0300-\\u036f]/g, \"\")\n            .replace(/\\(nouveau\\)/, \"\")\n            .replace(/\\(Pour coordination\\)/, \"\")\n            .replace(/\\(Supprimés?\\)/, \"\")\n            .replace(/ /g, \" \")\n            .replace(/[\\-,.…]/g, \"\")\n            .trim()\n            .replace(/ {1,}/g, \"_\")\n          const nameUpper = nameComputed.toUpperCase()\n          if (nameUpper === \"\") {\n            // Occurs in:\n            // * http://www.assemblee-nationale.fr/15/textes/0445.asp\n            // * http://www.assemblee-nationale.fr/15/textes/0626.asp\n            // Skip paragraph.\n            state = nextParentState\n            break\n          }\n          const nextLevel =\n            nameUpper.match(/^(RAPPORT_)?ANNEXE(_|$)/) !== null ||\n            nameUpper.match(/^ETAT_/) !== null\n              ? 0\n              : nameUpper.match(/^TOME_/) !== null\n              ? 1\n              : nameUpper.match(/^PARTIE_/) !== null ||\n                nameUpper.match(\n                  /^(PREMIERE|SECONDE|DEUXIEME|TROISIEME|QUATRIEME)_PARTIE(_|$)/,\n                ) !== null\n              ? 2\n              : nameUpper.match(/^LIVRE_/) !== null\n              ? 3\n              : nameUpper.match(/^TITRE_/) !== null\n              ? 4\n              : nameUpper.match(/^SOUSTITRE_/) !== null\n              ? 5\n              : nameUpper.match(/^CHAPITRE_/) !== null\n              ? 6\n              : nameUpper.match(/^SECTION_/) !== null\n              ? 7\n              : nameUpper.match(/^SOUSSECTION_/) !== null\n              ? 8\n              : nameUpper.match(/^ARTICLES?_/) !== null ||\n                // \"Exposé des motifs\" must be at the same level as article.\n                // \"Exposé des motifs\" without content:\n                // * http://www.assemblee-nationale.fr/15/textes/0702.asp\n                // \"Exposé des motifs\" with content:\n                // * http://www.assemblee-nationale.fr/15/textes/1326.asp\n                // * http://www.assemblee-nationale.fr/15/textes/1610.asp\n                nameUpper.match(/^EXPOSE_DES_MOTIFS$/) !== null\n              ? 9\n              : null\n          if (nextLevel === null && subdivisions.length === 0) {\n            if (nameUpper.match(/^(PROJET|PROPOSITION)_DE_LOI(_|$)/) !== null) {\n              // Occurs in:\n              // * http://www.assemblee-nationale.fr/15/textes/0232.asp\n              // * http://www.assemblee-nationale.fr/15/textes/0626.asp\n              // * http://www.assemblee-nationale.fr/15/textes/0676.asp\n            } else if (\n              nameUpper === \"JEUX_OLYMPIQUES_ET_PARALYMPIQUES_DE_2024\"\n            ) {\n              // Occurs in http://www.assemblee-nationale.fr/15/textes/0676.asp\n            } else if (nameUpper === \"TEXTE_DE_LA_COMMISSION_MIXTE_PARITAIRE\") {\n              // Occurs in http://www.assemblee-nationale.fr/15/textes/1294.asp\n            } else {\n              console.log(\n                `Unexpected nameUpper = \"${nameUpper}\" at beginning of \"texte de loi\" at ${assembleeUrl}`,\n              )\n            }\n            // Skip paragraph.\n            state = nextParentState\n            break\n          }\n          if (nextLevel !== null) {\n            level = nextLevel\n            while (levels.length > 0 && level < levels[levels.length - 1]) {\n              levels.pop()\n            }\n            if (levels.length === 0 || level > levels[levels.length - 1]) {\n              levels.push(level)\n            }\n            // Articles & \"Exposé des motifs\" are the only divisions without second title.\n            isMultiLinesHeader =\n              nameUpper.match(/^ARTICLES?_/) === null &&\n              nameUpper.match(/^EXPOSE_DES_MOTIFS$/) === null\n            subdivisionAlineasHtml = []\n            subdivisionAlineasText = []\n            subdivisionHeadersHtml = []\n            subdivisionHeadersText = []\n            subdivisions.push({\n              html: {\n                alineas: subdivisionAlineasHtml,\n                headers: subdivisionHeadersHtml,\n              },\n              id: \"D_\" + nameComputed,\n              level: level + 1,\n              relativeLevel: levels.length,\n              text: {\n                alineas: subdivisionAlineasText,\n                headers: subdivisionHeadersText,\n              },\n            })\n          }\n          lineElements = []\n          state = \"paragraphChild\"\n        }\n        break\n      case \"firstSubAlineaElement\":\n        subAlineaElement = alineaElement!.children[0]\n        if (subAlineaElement === undefined) {\n          // No sub-alinea in current alinea: go to next alinea.\n          state = \"nextAlineaElement\"\n        } else {\n          state = \"subAlineaElement\"\n        }\n        break\n      case \"nextAlineaElement\":\n        alineaElement = alineaElement!.nextElementSibling\n        if (alineaElement === null) {\n          // The bodyChild has been fully parsed. Go to next bodyChild\n          state = \"nextBodyChild\"\n        } else {\n          state = \"alineaElement\"\n        }\n        break\n      case \"nextBodyChild\":\n        if (bodyChild.nextElementSibling === null) {\n          // The document has been fully parsed.\n          state = null\n        } else {\n          bodyChild = bodyChild.nextElementSibling\n          if (bodyChild.tagName === \"DIV\") {\n            state = \"firstAlineaElement\"\n          } else {\n            // <P/> is for footnotes\n            assert(\n              [\"BR\", \"HR\", \"P\"].includes(bodyChild.tagName),\n              `Unexpected tag name \"${bodyChild.tagName}\" for body child`,\n            )\n            // Stay in the same state to go to next bodyChild.\n          }\n        }\n        break\n      case \"nextParagraphChild\":\n        paragraphChild = paragraphChild!.nextElementSibling\n        if (paragraphChild === null) {\n          // The paragraph element has been fully parsed. Go to next parent element.\n          const lineText = lineElements!\n            .map((element) => element.textContent)\n            .join(\"\")\n            .trim()\n          if (lineText) {\n            const lineHtml = lineElements!\n              .map((element) => element.outerHTML)\n              .join(\"\")\n            if (\n              subdivisionHeadersText!.length === 0 ||\n              (isMultiLinesHeader && subdivisionAlineasText!.length === 0)\n            ) {\n              subdivisionHeadersHtml!.push(lineHtml)\n              subdivisionHeadersText!.push(lineText)\n            } else {\n              subdivisionAlineasHtml!.push(lineHtml)\n              subdivisionAlineasText!.push(lineText)\n            }\n          }\n          if (isMultiLinesHeader && subdivisionHeadersText!.length >= 2) {\n            isMultiLinesHeader = false\n          }\n          lineElements = null\n          state = nextParentState\n        } else {\n          state = \"paragraphChild\"\n        }\n        break\n      case \"nextSubAlineaElement\":\n        subAlineaElement = subAlineaElement!.nextElementSibling\n        if (subAlineaElement === null) {\n          // The alineaElement has been fully parsed. Go to next alineaElement.\n          state = \"nextAlineaElement\"\n        } else {\n          state = \"subAlineaElement\"\n        }\n        break\n      case \"paragraphChild\":\n        switch (paragraphChild!.tagName) {\n          case \"A\": {\n            lineElements!.push(paragraphChild!)\n            break\n          }\n          case \"BR\": {\n            const lineText = lineElements!\n              .map((element) => element.textContent)\n              .join(\"\")\n              .trim()\n            if (lineText) {\n              const lineHtml = lineElements!\n                .map((element) => element.outerHTML)\n                .join(\"\")\n              if (\n                subdivisionHeadersText!.length === 0 ||\n                (isMultiLinesHeader && subdivisionAlineasText!.length === 0)\n              ) {\n                subdivisionHeadersHtml!.push(lineHtml)\n                subdivisionHeadersText!.push(lineText)\n              } else {\n                subdivisionAlineasHtml!.push(lineHtml)\n                subdivisionAlineasText!.push(lineText)\n              }\n            }\n            lineElements = []\n            break\n          }\n          case \"DEL\": {\n            lineElements!.push(paragraphChild!)\n            break\n          }\n          case \"IMG\": {\n            lineElements!.push(paragraphChild!)\n            break\n          }\n          case \"SPAN\": {\n            const className = paragraphChild!.getAttribute(\"class\")\n            switch (className) {\n              case \"aEloiPastille\": {\n                // Skip pastillé SPAN.\n                break\n              }\n              case \"aEloiPastille0\": {\n                // Skip pastillé SPAN.\n                break\n              }\n              default:\n                lineElements!.push(paragraphChild!)\n            }\n            break\n          }\n          default:\n            return {\n              error: {\n                code: -3,\n                message: `Unexpected tag name for paragraph child: ${\n                  paragraphChild!.tagName\n                }`,\n              },\n              html,\n              page,\n            }\n        }\n        state = \"nextParagraphChild\"\n        break\n      case \"subAlineaElement\":\n        switch (subAlineaElement!.tagName) {\n          case \"P\":\n            nextParentState = \"nextSubAlineaElement\"\n            paragraphElement = subAlineaElement\n            state = \"firstParagraphChild\"\n            break\n          case \"TABLE\":\n            // TODO\n            state = \"nextSubAlineaElement\"\n            break\n          default:\n            return {\n              error: {\n                code: -4,\n                message: `Unexpected tag name for sub alinea element: ${\n                  subAlineaElement!.tagName\n                }`,\n              },\n              html,\n              page,\n            }\n        }\n        break\n        state = \"nextSubAlineaElement\"\n        break\n      default:\n        throw `Unexpected state: ${state}`\n    }\n  }\n\n  window.close() // Free memory.\n\n  return {\n    error: null,\n    html,\n    page,\n    subdivisions,\n    url: assembleeUrl,\n  }\n}\n\nexport async function retrieveTexteLoiParsed(\n  fetch: (\n    url: string | Request,\n    init?: RequestInit | undefined,\n  ) => Promise<Response>,\n  assembleeUrl: string,\n) {\n  const response = await fetch(assembleeUrl)\n  const page = await response.text()\n  if (!response.ok) {\n    return {\n      error: { code: response.status, message: response.statusText },\n      page,\n    }\n  }\n  return parseTexteLoi(assembleeUrl, page)\n}\n"],"mappings":"AAAA,OAAOA,MAAP,MAAmB,QAAnB;AACA,SAASC,KAAT,QAAsB,OAAtB;AAEA,OAAO,SAASC,aAAT,CAAuBC,YAAvB,EAA6CC,IAA7C,EAA2D;EAChE;EACA,MAAMC,YAAY,GAAGD,IAAI,CAACE,KAAL,CAAW,UAAX,CAArB;EACAN,MAAM,CAACO,WAAP,CAAmBF,YAAY,CAACG,MAAhC,EAAwC,CAAxC,EAA2CJ,IAA3C;EACA,IAAIK,IAAI,GAAGJ,YAAY,CAAC,CAAD,CAAZ,CAAgBK,IAAhB,EAAX;EACAV,MAAM,CAACS,IAAI,CAACE,UAAL,CAAgB,MAAhB,CAAD,CAAN;EACAX,MAAM,CAACS,IAAI,CAACG,QAAL,CAAc,QAAd,CAAD,CAAN;EACAH,IAAI,GAAI,QAAOA,IAAI,CAACI,SAAL,CAAe,CAAf,EAAkBJ,IAAI,CAACD,MAAL,GAAc,CAAhC,CAAmC,SAAlD,CAPgE,CAShE;;EACA,MAAM;IAAEM;EAAF,IAAa,IAAIb,KAAJ,CAAUQ,IAAV,CAAnB;EACA,MAAM;IAAEM;EAAF,IAAeD,MAArB;EACAd,MAAM,CAACO,WAAP,CAAmBQ,QAAQ,CAACC,QAAT,CAAkBR,MAArC,EAA6C,CAA7C;EACA,MAAMS,WAAW,GAAGF,QAAQ,CAACC,QAAT,CAAkB,CAAlB,CAApB;EACAhB,MAAM,CAACO,WAAP,CAAmBU,WAAW,CAACD,QAAZ,CAAqBR,MAAxC,EAAgD,CAAhD;EACA,MAAMU,WAAW,GAAGD,WAAW,CAACD,QAAZ,CAAqB,CAArB,CAApB;;EACA,IAAIb,YAAY,KAAK,sDAArB,EAA6E;IAC3E;IACAH,MAAM,CAACO,WAAP,CAAmBW,WAAW,CAACF,QAAZ,CAAqBR,MAAxC,EAAgD,CAAhD;IACA,MAAMW,UAAU,GAAGD,WAAW,CAACF,QAAZ,CAAqB,CAArB,CAAnB;IACAhB,MAAM,CAACO,WAAP,CAAmBY,UAAU,CAACC,OAA9B,EAAuC,KAAvC;IACA,MAAMC,aAAa,GAAGH,WAAW,CAACI,YAAZ,CACpBP,QAAQ,CAACQ,aAAT,CAAuB,KAAvB,CADoB,EAEpBJ,UAFoB,CAAtB;IAIAD,WAAW,CAACI,YAAZ,CAAyBP,QAAQ,CAACQ,aAAT,CAAuB,IAAvB,CAAzB,EAAuDJ,UAAvD;;IACA,KAAK,MAAMK,QAAX,IAAuB,CAAC,GAAGL,UAAU,CAACH,QAAf,CAAvB,EAAiD;MAC/C,IAAIQ,QAAQ,CAACC,YAAT,CAAsB,OAAtB,MAAmC,cAAvC,EAAuD;QACrD;MACD;;MACDJ,aAAa,CAACK,WAAd,CAA0BF,QAA1B;IACD;EACF;;EACD,IAAIN,WAAW,CAACF,QAAZ,CAAqBR,MAArB,GAA8B,CAAlC,EAAqC;IACnC;IACAM,MAAM,CAACa,KAAP,GAFmC,CAEpB;;IACf,OAAO;MACLC,KAAK,EAAE;QAAEC,IAAI,EAAE,CAAC,CAAT;QAAYC,OAAO,EAAE;MAArB,CADF;MAELrB,IAFK;MAGLL;IAHK,CAAP;EAKD;;EACDJ,MAAM,CAACO,WAAP,CAAmBW,WAAW,CAACF,QAAZ,CAAqB,CAArB,EAAwBI,OAA3C,EAAoD,KAApD,EA1CgE,CA2ChE;;EACA,IAAIW,SAAS,GAAGb,WAAW,CAACF,QAAZ,CAAqB,CAArB,CAAhB;EACAhB,MAAM,CAACO,WAAP,CAAmBwB,SAAS,CAACX,OAA7B,EAAsC,IAAtC;EACA,IAAIY,aAA6B,GAAG,IAApC;EACA,IAAIC,kBAA2B,GAAG,KAAlC;EACA,IAAIC,KAAoB,GAAG,IAA3B;EACA,IAAIC,MAAgB,GAAG,EAAvB;EACA,IAAIC,YAA8B,GAAG,IAArC;EACA,IAAIC,eAAe,GAAG,IAAtB;EACA,IAAIC,cAA8B,GAAG,IAArC;EACA,IAAIC,gBAAgC,GAAG,IAAvC;EACA,IAAIC,KAAoB,GAAG,eAA3B;EACA,IAAIC,gBAAgC,GAAG,IAAvC;EACA,MAAMC,YAAY,GAAG,EAArB;EACA,IAAIC,sBAAuC,GAAG,IAA9C;EACA,IAAIC,sBAAuC,GAAG,IAA9C;EACA,IAAIC,sBAAuC,GAAG,IAA9C;EACA,IAAIC,sBAAuC,GAAG,IAA9C;;EACA,OAAON,KAAK,KAAK,IAAjB,EAAuB;IACrB,QAAQA,KAAR;MACE,KAAK,eAAL;QACE,QAAQR,aAAa,CAAEZ,OAAvB;UACE,KAAK,KAAL;YACEoB,KAAK,GAAG,uBAAR;YACA;;UACF,KAAK,IAAL;YACE;YACAH,eAAe,GAAG,mBAAlB;YACAE,gBAAgB,GAAGP,aAAnB;YACAQ,KAAK,GAAG,qBAAR;YACA;;UACF,KAAK,GAAL;YACEH,eAAe,GAAG,mBAAlB;YACAE,gBAAgB,GAAGP,aAAnB;YACAQ,KAAK,GAAG,qBAAR;YACA;;UACF,KAAK,IAAL;YACE;YACAA,KAAK,GAAG,mBAAR;YACA;;UACF,KAAK,OAAL;YACE;YACAA,KAAK,GAAG,mBAAR;YACA;;UACF;YACE,OAAO;cACLZ,KAAK,EAAE;gBACLC,IAAI,EAAE,CAAC,CADF;gBAELC,OAAO,EAAG,2CACRE,aAAa,CAAEZ,OAChB;cAJI,CADF;cAOLX,IAPK;cAQLL;YARK,CAAP;QAxBJ;;QAmCA;;MACF,KAAK,oBAAL;QACE4B,aAAa,GAAGD,SAAS,CAACf,QAAV,CAAmB,CAAnB,CAAhB;;QACA,IAAIgB,aAAa,KAAKe,SAAtB,EAAiC;UAC/B;UACAP,KAAK,GAAG,eAAR;QACD,CAHD,MAGO;UACLA,KAAK,GAAG,eAAR;QACD;;QACD;;MACF,KAAK,qBAAL;QACEF,cAAc,GAAGC,gBAAgB,CAAEvB,QAAlB,CAA2B,CAA3B,CAAjB;;QACA,IAAIsB,cAAc,KAAKS,SAAvB,EAAkC;UAChC;UACAP,KAAK,GAAGH,eAAR;QACD,CAHD,MAGO;UACL,MAAMW,UAAU,GAAGT,gBAAgB,CAAEU,WAArC;UACA,MAAMC,YAAY,GAAG,CAACF,UAAU,IAAI,EAAf,EAClBG,SADkB,CACR,KADQ,EAElBC,OAFkB,CAEV,kBAFU,EAEU,EAFV,EAGlBA,OAHkB,CAGV,aAHU,EAGK,EAHL,EAIlBA,OAJkB,CAIV,uBAJU,EAIe,EAJf,EAKlBA,OALkB,CAKV,gBALU,EAKQ,EALR,EAMlBA,OANkB,CAMV,IANU,EAMJ,GANI,EAOlBA,OAPkB,CAOV,UAPU,EAOE,EAPF,EAQlB1C,IARkB,GASlB0C,OATkB,CASV,QATU,EASA,GATA,CAArB;UAUA,MAAMC,SAAS,GAAGH,YAAY,CAACI,WAAb,EAAlB;;UACA,IAAID,SAAS,KAAK,EAAlB,EAAsB;YACpB;YACA;YACA;YACA;YACAb,KAAK,GAAGH,eAAR;YACA;UACD;;UACD,MAAMkB,SAAS,GACbF,SAAS,CAACG,KAAV,CAAgB,yBAAhB,MAA+C,IAA/C,IACAH,SAAS,CAACG,KAAV,CAAgB,QAAhB,MAA8B,IAD9B,GAEI,CAFJ,GAGIH,SAAS,CAACG,KAAV,CAAgB,QAAhB,MAA8B,IAA9B,GACA,CADA,GAEAH,SAAS,CAACG,KAAV,CAAgB,UAAhB,MAAgC,IAAhC,IACAH,SAAS,CAACG,KAAV,CACE,8DADF,MAEM,IAHN,GAIA,CAJA,GAKAH,SAAS,CAACG,KAAV,CAAgB,SAAhB,MAA+B,IAA/B,GACA,CADA,GAEAH,SAAS,CAACG,KAAV,CAAgB,SAAhB,MAA+B,IAA/B,GACA,CADA,GAEAH,SAAS,CAACG,KAAV,CAAgB,aAAhB,MAAmC,IAAnC,GACA,CADA,GAEAH,SAAS,CAACG,KAAV,CAAgB,YAAhB,MAAkC,IAAlC,GACA,CADA,GAEAH,SAAS,CAACG,KAAV,CAAgB,WAAhB,MAAiC,IAAjC,GACA,CADA,GAEAH,SAAS,CAACG,KAAV,CAAgB,eAAhB,MAAqC,IAArC,GACA,CADA,GAEAH,SAAS,CAACG,KAAV,CAAgB,aAAhB,MAAmC,IAAnC,IACA;UACA;UACA;UACA;UACA;UACA;UACAH,SAAS,CAACG,KAAV,CAAgB,qBAAhB,MAA2C,IAP3C,GAQA,CARA,GASA,IAhCN;;UAiCA,IAAID,SAAS,KAAK,IAAd,IAAsBb,YAAY,CAAClC,MAAb,KAAwB,CAAlD,EAAqD;YACnD,IAAI6C,SAAS,CAACG,KAAV,CAAgB,mCAAhB,MAAyD,IAA7D,EAAmE,CACjE;cACA;cACA;cACA;YACD,CALD,MAKO,IACLH,SAAS,KAAK,0CADT,EAEL,CACA;YACD,CAJM,MAIA,IAAIA,SAAS,KAAK,wCAAlB,EAA4D,CACjE;YACD,CAFM,MAEA;cACLI,OAAO,CAACC,GAAR,CACG,2BAA0BL,SAAU,uCAAsClD,YAAa,EAD1F;YAGD,CAhBkD,CAiBnD;;;YACAqC,KAAK,GAAGH,eAAR;YACA;UACD;;UACD,IAAIkB,SAAS,KAAK,IAAlB,EAAwB;YACtBrB,KAAK,GAAGqB,SAAR;;YACA,OAAOpB,MAAM,CAAC3B,MAAP,GAAgB,CAAhB,IAAqB0B,KAAK,GAAGC,MAAM,CAACA,MAAM,CAAC3B,MAAP,GAAgB,CAAjB,CAA1C,EAA+D;cAC7D2B,MAAM,CAACwB,GAAP;YACD;;YACD,IAAIxB,MAAM,CAAC3B,MAAP,KAAkB,CAAlB,IAAuB0B,KAAK,GAAGC,MAAM,CAACA,MAAM,CAAC3B,MAAP,GAAgB,CAAjB,CAAzC,EAA8D;cAC5D2B,MAAM,CAACyB,IAAP,CAAY1B,KAAZ;YACD,CAPqB,CAQtB;;;YACAD,kBAAkB,GAChBoB,SAAS,CAACG,KAAV,CAAgB,aAAhB,MAAmC,IAAnC,IACAH,SAAS,CAACG,KAAV,CAAgB,qBAAhB,MAA2C,IAF7C;YAGAb,sBAAsB,GAAG,EAAzB;YACAC,sBAAsB,GAAG,EAAzB;YACAC,sBAAsB,GAAG,EAAzB;YACAC,sBAAsB,GAAG,EAAzB;YACAJ,YAAY,CAACkB,IAAb,CAAkB;cAChBnD,IAAI,EAAE;gBACJoD,OAAO,EAAElB,sBADL;gBAEJmB,OAAO,EAAEjB;cAFL,CADU;cAKhBkB,EAAE,EAAE,OAAOb,YALK;cAMhBhB,KAAK,EAAEA,KAAK,GAAG,CANC;cAOhB8B,aAAa,EAAE7B,MAAM,CAAC3B,MAPN;cAQhByD,IAAI,EAAE;gBACJJ,OAAO,EAAEjB,sBADL;gBAEJkB,OAAO,EAAEhB;cAFL;YARU,CAAlB;UAaD;;UACDV,YAAY,GAAG,EAAf;UACAI,KAAK,GAAG,gBAAR;QACD;;QACD;;MACF,KAAK,uBAAL;QACEC,gBAAgB,GAAGT,aAAa,CAAEhB,QAAf,CAAwB,CAAxB,CAAnB;;QACA,IAAIyB,gBAAgB,KAAKM,SAAzB,EAAoC;UAClC;UACAP,KAAK,GAAG,mBAAR;QACD,CAHD,MAGO;UACLA,KAAK,GAAG,kBAAR;QACD;;QACD;;MACF,KAAK,mBAAL;QACER,aAAa,GAAGA,aAAa,CAAEkC,kBAA/B;;QACA,IAAIlC,aAAa,KAAK,IAAtB,EAA4B;UAC1B;UACAQ,KAAK,GAAG,eAAR;QACD,CAHD,MAGO;UACLA,KAAK,GAAG,eAAR;QACD;;QACD;;MACF,KAAK,eAAL;QACE,IAAIT,SAAS,CAACmC,kBAAV,KAAiC,IAArC,EAA2C;UACzC;UACA1B,KAAK,GAAG,IAAR;QACD,CAHD,MAGO;UACLT,SAAS,GAAGA,SAAS,CAACmC,kBAAtB;;UACA,IAAInC,SAAS,CAACX,OAAV,KAAsB,KAA1B,EAAiC;YAC/BoB,KAAK,GAAG,oBAAR;UACD,CAFD,MAEO;YACL;YACAxC,MAAM,CACJ,CAAC,IAAD,EAAO,IAAP,EAAa,GAAb,EAAkBmE,QAAlB,CAA2BpC,SAAS,CAACX,OAArC,CADI,EAEH,wBAAuBW,SAAS,CAACX,OAAQ,kBAFtC,CAAN,CAFK,CAML;UACD;QACF;;QACD;;MACF,KAAK,oBAAL;QACEkB,cAAc,GAAGA,cAAc,CAAE4B,kBAAjC;;QACA,IAAI5B,cAAc,KAAK,IAAvB,EAA6B;UAC3B;UACA,MAAM8B,QAAQ,GAAGhC,YAAY,CAC1BiC,GADc,CACTC,OAAD,IAAaA,OAAO,CAACrB,WADX,EAEdsB,IAFc,CAET,EAFS,EAGd7D,IAHc,EAAjB;;UAIA,IAAI0D,QAAJ,EAAc;YACZ,MAAMI,QAAQ,GAAGpC,YAAY,CAC1BiC,GADc,CACTC,OAAD,IAAaA,OAAO,CAACG,SADX,EAEdF,IAFc,CAET,EAFS,CAAjB;;YAGA,IACEzB,sBAAsB,CAAEtC,MAAxB,KAAmC,CAAnC,IACCyB,kBAAkB,IAAIW,sBAAsB,CAAEpC,MAAxB,KAAmC,CAF5D,EAGE;cACAqC,sBAAsB,CAAEe,IAAxB,CAA6BY,QAA7B;cACA1B,sBAAsB,CAAEc,IAAxB,CAA6BQ,QAA7B;YACD,CAND,MAMO;cACLzB,sBAAsB,CAAEiB,IAAxB,CAA6BY,QAA7B;cACA5B,sBAAsB,CAAEgB,IAAxB,CAA6BQ,QAA7B;YACD;UACF;;UACD,IAAInC,kBAAkB,IAAIa,sBAAsB,CAAEtC,MAAxB,IAAkC,CAA5D,EAA+D;YAC7DyB,kBAAkB,GAAG,KAArB;UACD;;UACDG,YAAY,GAAG,IAAf;UACAI,KAAK,GAAGH,eAAR;QACD,CA1BD,MA0BO;UACLG,KAAK,GAAG,gBAAR;QACD;;QACD;;MACF,KAAK,sBAAL;QACEC,gBAAgB,GAAGA,gBAAgB,CAAEyB,kBAArC;;QACA,IAAIzB,gBAAgB,KAAK,IAAzB,EAA+B;UAC7B;UACAD,KAAK,GAAG,mBAAR;QACD,CAHD,MAGO;UACLA,KAAK,GAAG,kBAAR;QACD;;QACD;;MACF,KAAK,gBAAL;QACE,QAAQF,cAAc,CAAElB,OAAxB;UACE,KAAK,GAAL;YAAU;cACRgB,YAAY,CAAEwB,IAAd,CAAmBtB,cAAnB;cACA;YACD;;UACD,KAAK,IAAL;YAAW;cACT,MAAM8B,QAAQ,GAAGhC,YAAY,CAC1BiC,GADc,CACTC,OAAD,IAAaA,OAAO,CAACrB,WADX,EAEdsB,IAFc,CAET,EAFS,EAGd7D,IAHc,EAAjB;;cAIA,IAAI0D,QAAJ,EAAc;gBACZ,MAAMI,QAAQ,GAAGpC,YAAY,CAC1BiC,GADc,CACTC,OAAD,IAAaA,OAAO,CAACG,SADX,EAEdF,IAFc,CAET,EAFS,CAAjB;;gBAGA,IACEzB,sBAAsB,CAAEtC,MAAxB,KAAmC,CAAnC,IACCyB,kBAAkB,IAAIW,sBAAsB,CAAEpC,MAAxB,KAAmC,CAF5D,EAGE;kBACAqC,sBAAsB,CAAEe,IAAxB,CAA6BY,QAA7B;kBACA1B,sBAAsB,CAAEc,IAAxB,CAA6BQ,QAA7B;gBACD,CAND,MAMO;kBACLzB,sBAAsB,CAAEiB,IAAxB,CAA6BY,QAA7B;kBACA5B,sBAAsB,CAAEgB,IAAxB,CAA6BQ,QAA7B;gBACD;cACF;;cACDhC,YAAY,GAAG,EAAf;cACA;YACD;;UACD,KAAK,KAAL;YAAY;cACVA,YAAY,CAAEwB,IAAd,CAAmBtB,cAAnB;cACA;YACD;;UACD,KAAK,KAAL;YAAY;cACVF,YAAY,CAAEwB,IAAd,CAAmBtB,cAAnB;cACA;YACD;;UACD,KAAK,MAAL;YAAa;cACX,MAAMoC,SAAS,GAAGpC,cAAc,CAAEb,YAAhB,CAA6B,OAA7B,CAAlB;;cACA,QAAQiD,SAAR;gBACE,KAAK,eAAL;kBAAsB;oBACpB;oBACA;kBACD;;gBACD,KAAK,gBAAL;kBAAuB;oBACrB;oBACA;kBACD;;gBACD;kBACEtC,YAAY,CAAEwB,IAAd,CAAmBtB,cAAnB;cAVJ;;cAYA;YACD;;UACD;YACE,OAAO;cACLV,KAAK,EAAE;gBACLC,IAAI,EAAE,CAAC,CADF;gBAELC,OAAO,EAAG,4CACRQ,cAAc,CAAElB,OACjB;cAJI,CADF;cAOLX,IAPK;cAQLL;YARK,CAAP;QArDJ;;QAgEAoC,KAAK,GAAG,oBAAR;QACA;;MACF,KAAK,kBAAL;QACE,QAAQC,gBAAgB,CAAErB,OAA1B;UACE,KAAK,GAAL;YACEiB,eAAe,GAAG,sBAAlB;YACAE,gBAAgB,GAAGE,gBAAnB;YACAD,KAAK,GAAG,qBAAR;YACA;;UACF,KAAK,OAAL;YACE;YACAA,KAAK,GAAG,sBAAR;YACA;;UACF;YACE,OAAO;cACLZ,KAAK,EAAE;gBACLC,IAAI,EAAE,CAAC,CADF;gBAELC,OAAO,EAAG,+CACRW,gBAAgB,CAAErB,OACnB;cAJI,CADF;cAOLX,IAPK;cAQLL;YARK,CAAP;QAXJ;;QAsBA;QACAoC,KAAK,GAAG,sBAAR;QACA;;MACF;QACE,MAAO,qBAAoBA,KAAM,EAAjC;IA5UJ;EA8UD;;EAED1B,MAAM,CAACa,KAAP,GA9YgE,CA8YjD;;EAEf,OAAO;IACLC,KAAK,EAAE,IADF;IAELnB,IAFK;IAGLL,IAHK;IAILsC,YAJK;IAKLiC,GAAG,EAAExE;EALA,CAAP;AAOD;AAED,OAAO,eAAeyE,sBAAf,CACLC,KADK,EAKL1E,YALK,EAML;EACA,MAAM2E,QAAQ,GAAG,MAAMD,KAAK,CAAC1E,YAAD,CAA5B;EACA,MAAMC,IAAI,GAAG,MAAM0E,QAAQ,CAACb,IAAT,EAAnB;;EACA,IAAI,CAACa,QAAQ,CAACC,EAAd,EAAkB;IAChB,OAAO;MACLnD,KAAK,EAAE;QAAEC,IAAI,EAAEiD,QAAQ,CAACE,MAAjB;QAAyBlD,OAAO,EAAEgD,QAAQ,CAACG;MAA3C,CADF;MAEL7E;IAFK,CAAP;EAID;;EACD,OAAOF,aAAa,CAACC,YAAD,EAAeC,IAAf,CAApB;AACD"}
|
package/lib/parsers/index.js
CHANGED
|
@@ -1,3 +1,36 @@
|
|
|
1
|
-
|
|
2
|
-
|
|
3
|
-
|
|
1
|
+
"use strict";
|
|
2
|
+
|
|
3
|
+
require("core-js/modules/es.object.define-property.js");
|
|
4
|
+
|
|
5
|
+
Object.defineProperty(exports, "__esModule", {
|
|
6
|
+
value: true
|
|
7
|
+
});
|
|
8
|
+
Object.defineProperty(exports, "iterRechercheAmendements", {
|
|
9
|
+
enumerable: true,
|
|
10
|
+
get: function get() {
|
|
11
|
+
return _recherche_amendements.iterRechercheAmendements;
|
|
12
|
+
}
|
|
13
|
+
});
|
|
14
|
+
Object.defineProperty(exports, "iterRechercheRawAmendements", {
|
|
15
|
+
enumerable: true,
|
|
16
|
+
get: function get() {
|
|
17
|
+
return _recherche_amendements.iterRechercheRawAmendements;
|
|
18
|
+
}
|
|
19
|
+
});
|
|
20
|
+
Object.defineProperty(exports, "parseTexteLoi", {
|
|
21
|
+
enumerable: true,
|
|
22
|
+
get: function get() {
|
|
23
|
+
return _documents.parseTexteLoi;
|
|
24
|
+
}
|
|
25
|
+
});
|
|
26
|
+
Object.defineProperty(exports, "retrieveTexteLoiParsed", {
|
|
27
|
+
enumerable: true,
|
|
28
|
+
get: function get() {
|
|
29
|
+
return _documents.retrieveTexteLoiParsed;
|
|
30
|
+
}
|
|
31
|
+
});
|
|
32
|
+
|
|
33
|
+
var _documents = require("./documents");
|
|
34
|
+
|
|
35
|
+
var _recherche_amendements = require("./recherche_amendements");
|
|
36
|
+
//# sourceMappingURL=data:application/json;charset=utf-8;base64,eyJ2ZXJzaW9uIjozLCJuYW1lcyI6W10sInNvdXJjZXMiOlsiLi4vLi4vc3JjL3BhcnNlcnMvaW5kZXgudHMiXSwic291cmNlc0NvbnRlbnQiOlsiZXhwb3J0IHsgcGFyc2VUZXh0ZUxvaSwgcmV0cmlldmVUZXh0ZUxvaVBhcnNlZCB9IGZyb20gXCIuL2RvY3VtZW50c1wiXG5leHBvcnQge1xuICBpdGVyUmVjaGVyY2hlQW1lbmRlbWVudHMsXG4gIGl0ZXJSZWNoZXJjaGVSYXdBbWVuZGVtZW50cyxcbn0gZnJvbSBcIi4vcmVjaGVyY2hlX2FtZW5kZW1lbnRzXCJcbiJdLCJtYXBwaW5ncyI6Ijs7Ozs7Ozs7Ozs7Ozs7Ozs7Ozs7Ozs7Ozs7Ozs7Ozs7QUFBQTs7QUFDQSJ9
|
|
@@ -0,0 +1,3 @@
|
|
|
1
|
+
export { parseTexteLoi, retrieveTexteLoiParsed } from "./documents.mjs";
|
|
2
|
+
export { iterRechercheAmendements, iterRechercheRawAmendements } from "./recherche_amendements.mjs";
|
|
3
|
+
//# sourceMappingURL=data:application/json;charset=utf-8;base64,eyJ2ZXJzaW9uIjozLCJuYW1lcyI6WyJwYXJzZVRleHRlTG9pIiwicmV0cmlldmVUZXh0ZUxvaVBhcnNlZCIsIml0ZXJSZWNoZXJjaGVBbWVuZGVtZW50cyIsIml0ZXJSZWNoZXJjaGVSYXdBbWVuZGVtZW50cyJdLCJzb3VyY2VzIjpbIi4uLy4uL3NyYy9wYXJzZXJzL2luZGV4LnRzIl0sInNvdXJjZXNDb250ZW50IjpbImV4cG9ydCB7IHBhcnNlVGV4dGVMb2ksIHJldHJpZXZlVGV4dGVMb2lQYXJzZWQgfSBmcm9tIFwiLi9kb2N1bWVudHNcIlxuZXhwb3J0IHtcbiAgaXRlclJlY2hlcmNoZUFtZW5kZW1lbnRzLFxuICBpdGVyUmVjaGVyY2hlUmF3QW1lbmRlbWVudHMsXG59IGZyb20gXCIuL3JlY2hlcmNoZV9hbWVuZGVtZW50c1wiXG4iXSwibWFwcGluZ3MiOiJTQUFTQSxhLEVBQWVDLHNCO1NBRXRCQyx3QixFQUNBQywyQiJ9
|