@tricoteuses/senat 2.22.3 → 2.22.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (258) hide show
  1. package/lib/aggregates.d.ts +52 -0
  2. package/lib/aggregates.js +930 -0
  3. package/lib/aggregates.mjs +713 -0
  4. package/lib/aggregates.ts +833 -0
  5. package/lib/config.d.ts +10 -0
  6. package/lib/config.js +16 -0
  7. package/lib/config.mjs +16 -0
  8. package/lib/config.ts +26 -0
  9. package/lib/databases.d.ts +2 -0
  10. package/lib/databases.js +26 -0
  11. package/lib/databases.mjs +57 -0
  12. package/lib/databases.ts +71 -0
  13. package/lib/datasets.d.ts +34 -0
  14. package/lib/datasets.js +233 -0
  15. package/lib/datasets.mjs +78 -0
  16. package/lib/datasets.ts +118 -0
  17. package/lib/fields.d.ts +10 -0
  18. package/lib/fields.js +68 -0
  19. package/lib/fields.mjs +22 -0
  20. package/lib/fields.ts +29 -0
  21. package/lib/git.d.ts +26 -0
  22. package/lib/git.js +167 -0
  23. package/lib/index.d.ts +13 -0
  24. package/lib/index.js +1 -0
  25. package/lib/index.mjs +7 -0
  26. package/lib/index.ts +64 -0
  27. package/lib/inserters.d.ts +98 -0
  28. package/lib/inserters.js +500 -0
  29. package/lib/inserters.mjs +360 -0
  30. package/lib/inserters.ts +521 -0
  31. package/lib/legislatures.json +38 -0
  32. package/lib/loaders.d.ts +58 -0
  33. package/lib/loaders.js +286 -0
  34. package/lib/loaders.mjs +158 -0
  35. package/lib/loaders.ts +271 -0
  36. package/lib/model/agenda.d.ts +6 -0
  37. package/lib/model/agenda.js +148 -0
  38. package/lib/model/ameli.d.ts +51 -0
  39. package/lib/model/ameli.js +149 -0
  40. package/lib/model/ameli.mjs +84 -0
  41. package/lib/model/ameli.ts +100 -0
  42. package/lib/model/commission.d.ts +18 -0
  43. package/lib/model/commission.js +269 -0
  44. package/lib/model/debats.d.ts +67 -0
  45. package/lib/model/debats.js +95 -0
  46. package/lib/model/debats.mjs +43 -0
  47. package/lib/model/debats.ts +68 -0
  48. package/lib/model/documents.d.ts +12 -0
  49. package/lib/model/documents.js +151 -0
  50. package/lib/model/dosleg.d.ts +7 -0
  51. package/lib/model/dosleg.js +326 -0
  52. package/lib/model/dosleg.mjs +196 -0
  53. package/lib/model/dosleg.ts +240 -0
  54. package/lib/model/index.d.ts +7 -0
  55. package/lib/model/index.js +7 -0
  56. package/lib/model/index.mjs +5 -0
  57. package/lib/model/index.ts +15 -0
  58. package/lib/model/questions.d.ts +45 -0
  59. package/lib/model/questions.js +89 -0
  60. package/lib/model/questions.mjs +71 -0
  61. package/lib/model/questions.ts +93 -0
  62. package/lib/model/scrutins.d.ts +13 -0
  63. package/lib/model/scrutins.js +114 -0
  64. package/lib/model/seance.d.ts +3 -0
  65. package/lib/model/seance.js +267 -0
  66. package/lib/model/sens.d.ts +146 -0
  67. package/lib/model/sens.js +454 -0
  68. package/lib/model/sens.mjs +415 -0
  69. package/lib/model/sens.ts +516 -0
  70. package/lib/model/texte.d.ts +7 -0
  71. package/lib/model/texte.js +256 -0
  72. package/lib/model/texte.mjs +208 -0
  73. package/lib/model/texte.ts +229 -0
  74. package/lib/model/util.d.ts +9 -0
  75. package/lib/model/util.js +38 -0
  76. package/lib/model/util.mjs +19 -0
  77. package/lib/model/util.ts +32 -0
  78. package/lib/parsers/texte.d.ts +7 -0
  79. package/lib/parsers/texte.js +228 -0
  80. package/lib/raw_types/ameli.d.ts +914 -0
  81. package/lib/raw_types/ameli.js +5 -0
  82. package/lib/raw_types/ameli.mjs +163 -0
  83. package/lib/raw_types/debats.d.ts +207 -0
  84. package/lib/raw_types/debats.js +5 -0
  85. package/lib/raw_types/debats.mjs +58 -0
  86. package/lib/raw_types/dosleg.d.ts +1619 -0
  87. package/lib/raw_types/dosleg.js +5 -0
  88. package/lib/raw_types/dosleg.mjs +438 -0
  89. package/lib/raw_types/questions.d.ts +419 -0
  90. package/lib/raw_types/questions.js +5 -0
  91. package/lib/raw_types/questions.mjs +11 -0
  92. package/lib/raw_types/senat.d.ts +11368 -0
  93. package/lib/raw_types/senat.js +5 -0
  94. package/lib/raw_types/sens.d.ts +8248 -0
  95. package/lib/raw_types/sens.js +5 -0
  96. package/lib/raw_types/sens.mjs +508 -0
  97. package/lib/raw_types_kysely/ameli.d.ts +915 -0
  98. package/lib/raw_types_kysely/ameli.js +7 -0
  99. package/lib/raw_types_kysely/ameli.mjs +5 -0
  100. package/lib/raw_types_kysely/ameli.ts +951 -0
  101. package/lib/raw_types_kysely/debats.d.ts +207 -0
  102. package/lib/raw_types_kysely/debats.js +7 -0
  103. package/lib/raw_types_kysely/debats.mjs +5 -0
  104. package/lib/raw_types_kysely/debats.ts +222 -0
  105. package/lib/raw_types_kysely/dosleg.d.ts +3532 -0
  106. package/lib/raw_types_kysely/dosleg.js +7 -0
  107. package/lib/raw_types_kysely/dosleg.mjs +5 -0
  108. package/lib/raw_types_kysely/dosleg.ts +3621 -0
  109. package/lib/raw_types_kysely/questions.d.ts +414 -0
  110. package/lib/raw_types_kysely/questions.js +7 -0
  111. package/lib/raw_types_kysely/questions.mjs +5 -0
  112. package/lib/raw_types_kysely/questions.ts +426 -0
  113. package/lib/raw_types_kysely/sens.d.ts +4394 -0
  114. package/lib/raw_types_kysely/sens.js +7 -0
  115. package/lib/raw_types_kysely/sens.mjs +5 -0
  116. package/lib/raw_types_kysely/sens.ts +4499 -0
  117. package/lib/raw_types_schemats/ameli.d.ts +539 -0
  118. package/lib/raw_types_schemats/ameli.js +2 -0
  119. package/lib/raw_types_schemats/ameli.mjs +2 -0
  120. package/lib/raw_types_schemats/ameli.ts +601 -0
  121. package/lib/raw_types_schemats/debats.d.ts +127 -0
  122. package/lib/raw_types_schemats/debats.js +2 -0
  123. package/lib/raw_types_schemats/debats.mjs +2 -0
  124. package/lib/raw_types_schemats/debats.ts +145 -0
  125. package/lib/raw_types_schemats/dosleg.d.ts +977 -0
  126. package/lib/raw_types_schemats/dosleg.js +2 -0
  127. package/lib/raw_types_schemats/dosleg.mjs +2 -0
  128. package/lib/raw_types_schemats/dosleg.ts +2193 -0
  129. package/lib/raw_types_schemats/questions.d.ts +235 -0
  130. package/lib/raw_types_schemats/questions.js +2 -0
  131. package/lib/raw_types_schemats/questions.mjs +2 -0
  132. package/lib/raw_types_schemats/questions.ts +249 -0
  133. package/lib/raw_types_schemats/sens.d.ts +6915 -0
  134. package/lib/raw_types_schemats/sens.js +2 -0
  135. package/lib/raw_types_schemats/sens.mjs +2 -0
  136. package/lib/raw_types_schemats/sens.ts +2907 -0
  137. package/lib/scripts/convert_data.d.ts +1 -0
  138. package/lib/scripts/convert_data.js +354 -0
  139. package/lib/scripts/convert_data.mjs +181 -0
  140. package/lib/scripts/convert_data.ts +243 -0
  141. package/lib/scripts/data-download.d.ts +1 -0
  142. package/lib/scripts/data-download.js +12 -0
  143. package/lib/scripts/datautil.d.ts +8 -0
  144. package/lib/scripts/datautil.js +34 -0
  145. package/lib/scripts/datautil.mjs +16 -0
  146. package/lib/scripts/datautil.ts +19 -0
  147. package/lib/scripts/images/transparent_150x192.jpg +0 -0
  148. package/lib/scripts/images/transparent_155x225.jpg +0 -0
  149. package/lib/scripts/parse_textes.d.ts +1 -0
  150. package/lib/scripts/parse_textes.js +44 -0
  151. package/lib/scripts/parse_textes.mjs +46 -0
  152. package/lib/scripts/parse_textes.ts +65 -0
  153. package/lib/scripts/retrieve_agenda.d.ts +1 -0
  154. package/lib/scripts/retrieve_agenda.js +132 -0
  155. package/lib/scripts/retrieve_cr_commission.d.ts +1 -0
  156. package/lib/scripts/retrieve_cr_commission.js +364 -0
  157. package/lib/scripts/retrieve_cr_seance.d.ts +6 -0
  158. package/lib/scripts/retrieve_cr_seance.js +347 -0
  159. package/lib/scripts/retrieve_documents.d.ts +3 -0
  160. package/lib/scripts/retrieve_documents.js +219 -0
  161. package/lib/scripts/retrieve_documents.mjs +249 -0
  162. package/lib/scripts/retrieve_documents.ts +298 -0
  163. package/lib/scripts/retrieve_open_data.d.ts +1 -0
  164. package/lib/scripts/retrieve_open_data.js +315 -0
  165. package/lib/scripts/retrieve_open_data.mjs +217 -0
  166. package/lib/scripts/retrieve_open_data.ts +268 -0
  167. package/lib/scripts/retrieve_senateurs_photos.d.ts +1 -0
  168. package/lib/scripts/retrieve_senateurs_photos.js +147 -0
  169. package/lib/scripts/retrieve_senateurs_photos.mjs +147 -0
  170. package/lib/scripts/retrieve_senateurs_photos.ts +177 -0
  171. package/lib/scripts/retrieve_videos.d.ts +1 -0
  172. package/lib/scripts/retrieve_videos.js +461 -0
  173. package/lib/scripts/shared/cli_helpers.d.ts +95 -0
  174. package/lib/scripts/shared/cli_helpers.js +91 -0
  175. package/lib/scripts/shared/cli_helpers.ts +36 -0
  176. package/lib/scripts/shared/util.d.ts +4 -0
  177. package/lib/scripts/shared/util.js +35 -0
  178. package/lib/scripts/shared/util.ts +33 -0
  179. package/lib/scripts/test_iter_load.d.ts +1 -0
  180. package/lib/scripts/test_iter_load.js +12 -0
  181. package/lib/src/conversion_textes.js +10 -1
  182. package/lib/src/index.d.ts +1 -1
  183. package/lib/src/index.js +1 -1
  184. package/lib/src/loaders.d.ts +1 -0
  185. package/lib/src/loaders.js +1 -0
  186. package/lib/src/model/ameli.js +1 -0
  187. package/lib/src/parsers/texte.js +2 -2
  188. package/lib/src/scripts/convert_data.js +11 -10
  189. package/lib/src/scripts/retrieve_documents.d.ts +1 -1
  190. package/lib/src/scripts/retrieve_documents.js +25 -10
  191. package/lib/src/scripts/retrieve_open_data.js +1 -1
  192. package/lib/src/types/sessions.d.ts +5 -4
  193. package/lib/src/types/sessions.js +10 -75
  194. package/lib/src/types/texte.d.ts +2 -0
  195. package/lib/strings.d.ts +1 -0
  196. package/lib/strings.js +18 -0
  197. package/lib/strings.mjs +18 -0
  198. package/lib/strings.ts +26 -0
  199. package/lib/types/agenda.d.ts +44 -0
  200. package/lib/types/agenda.js +1 -0
  201. package/lib/types/ameli.d.ts +5 -0
  202. package/lib/types/ameli.js +1 -0
  203. package/lib/types/ameli.mjs +13 -0
  204. package/lib/types/ameli.ts +21 -0
  205. package/lib/types/compte_rendu.d.ts +83 -0
  206. package/lib/types/compte_rendu.js +1 -0
  207. package/lib/types/debats.d.ts +2 -0
  208. package/lib/types/debats.js +1 -0
  209. package/lib/types/debats.mjs +2 -0
  210. package/lib/types/debats.ts +6 -0
  211. package/lib/types/dosleg.d.ts +70 -0
  212. package/lib/types/dosleg.js +1 -0
  213. package/lib/types/dosleg.mjs +151 -0
  214. package/lib/types/dosleg.ts +284 -0
  215. package/lib/types/questions.d.ts +2 -0
  216. package/lib/types/questions.js +1 -0
  217. package/lib/types/questions.mjs +1 -0
  218. package/lib/types/questions.ts +3 -0
  219. package/lib/types/sens.d.ts +10 -0
  220. package/lib/types/sens.js +1 -0
  221. package/lib/types/sens.mjs +1 -0
  222. package/lib/types/sens.ts +12 -0
  223. package/lib/types/sessions.d.ts +5 -0
  224. package/lib/types/sessions.js +84 -0
  225. package/lib/types/sessions.mjs +43 -0
  226. package/lib/types/sessions.ts +42 -0
  227. package/lib/types/texte.d.ts +74 -0
  228. package/lib/types/texte.js +16 -0
  229. package/lib/types/texte.mjs +16 -0
  230. package/lib/types/texte.ts +76 -0
  231. package/lib/typings/windows-1252.d.js +2 -0
  232. package/lib/typings/windows-1252.d.mjs +2 -0
  233. package/lib/typings/windows-1252.d.ts +11 -0
  234. package/lib/utils/cr_spliting.d.ts +28 -0
  235. package/lib/utils/cr_spliting.js +265 -0
  236. package/lib/utils/date.d.ts +10 -0
  237. package/lib/utils/date.js +100 -0
  238. package/lib/utils/nvs-timecode.d.ts +7 -0
  239. package/lib/utils/nvs-timecode.js +79 -0
  240. package/lib/utils/reunion_grouping.d.ts +9 -0
  241. package/lib/utils/reunion_grouping.js +361 -0
  242. package/lib/utils/reunion_odj_building.d.ts +5 -0
  243. package/lib/utils/reunion_odj_building.js +154 -0
  244. package/lib/utils/reunion_parsing.d.ts +23 -0
  245. package/lib/utils/reunion_parsing.js +209 -0
  246. package/lib/utils/scoring.d.ts +14 -0
  247. package/lib/utils/scoring.js +147 -0
  248. package/lib/utils/string_cleaning.d.ts +7 -0
  249. package/lib/utils/string_cleaning.js +57 -0
  250. package/lib/validators/config.d.ts +9 -0
  251. package/lib/validators/config.js +10 -0
  252. package/lib/validators/config.mjs +54 -0
  253. package/lib/validators/config.ts +79 -0
  254. package/lib/validators/senat.d.ts +0 -0
  255. package/lib/validators/senat.js +28 -0
  256. package/lib/validators/senat.mjs +24 -0
  257. package/lib/validators/senat.ts +26 -0
  258. package/package.json +5 -5
@@ -0,0 +1 @@
1
+ export {};
@@ -0,0 +1,354 @@
1
+ import assert from "assert";
2
+ import commandLineArgs from "command-line-args";
3
+ import fs from "fs-extra";
4
+ import path from "path";
5
+ import pLimit from "p-limit";
6
+ import * as git from "../git";
7
+ import { datasets, EnabledDatasets, getEnabledDatasets } from "../datasets";
8
+ import { DATA_ORIGINAL_FOLDER, DATA_TRANSFORMED_FOLDER, DOCUMENT_METADATA_FILE, DOSLEG_DOSSIERS_FOLDER, SCRUTINS_FOLDER, RAPPORT_FOLDER, SENS_CIRCONSCRIPTIONS_FOLDER, SENS_ORGANISMES_FOLDER, SENS_SENATEURS_FOLDER, TEXTE_FOLDER } from "../loaders";
9
+ import { findAllAmendements, findAllCirconscriptions, findAllDebats, findAllDossiers, findAllScrutins, findAllOrganismes, findAllQuestions, findAllSens, findAllTextes, findAllRapports, } from "../model";
10
+ import { processRapport, processTexte } from "./retrieve_documents";
11
+ import { buildActesLegislatifs } from "../model/dosleg";
12
+ import { UNDEFINED_SESSION } from "../types/sessions";
13
+ import { getSessionFromDate, getSessionFromSignet } from "./datautil";
14
+ import { commonOptions } from "./shared/cli_helpers";
15
+ import { ensureAndClearDir } from "./shared/util";
16
+ const optionsDefinitions = [...commonOptions];
17
+ const options = commandLineArgs(optionsDefinitions);
18
+ const SENAT_TEXTE_XML_BASE_URL = "https://www.senat.fr/akomantoso/";
19
+ const SENAT_TEXTE_BASE_URL = "https://www.senat.fr/leg/";
20
+ const SENAT_EXPOSE_DES_MOTIFS_BASE_URL = "https://www.senat.fr/leg/exposes-des-motifs/";
21
+ const SENAT_RAPPORT_BASE_URL = "https://www.senat.fr/rap/";
22
+ function commitGit(datasetDir, options, exitCode) {
23
+ if (options.commit) {
24
+ const errorCode = git.commitAndPush(datasetDir, "Nouvelle moisson", options.remote);
25
+ if ((exitCode === 10 && errorCode !== 10) || (exitCode === 0 && errorCode !== 0 && errorCode !== 10)) {
26
+ exitCode = errorCode;
27
+ }
28
+ }
29
+ return exitCode;
30
+ }
31
+ async function convertData() {
32
+ const dataDir = options["dataDir"];
33
+ assert(dataDir, "Missing argument: data directory");
34
+ const enabledDatasets = getEnabledDatasets(options["categories"]);
35
+ console.time("data transformation time");
36
+ let exitCode = 0;
37
+ if (enabledDatasets & EnabledDatasets.Ameli) {
38
+ try {
39
+ await convertDatasetAmeli(dataDir, options);
40
+ const ameliDir = path.join(dataDir, datasets.ameli.database);
41
+ exitCode = commitGit(ameliDir, options, exitCode);
42
+ }
43
+ catch (error) {
44
+ console.error(`Error converting Ameli dataset:`, error);
45
+ }
46
+ }
47
+ if (enabledDatasets & EnabledDatasets.Debats) {
48
+ try {
49
+ await convertDatasetDebats(dataDir, options);
50
+ const debatsDir = path.join(dataDir, datasets.debats.database);
51
+ exitCode = commitGit(debatsDir, options, exitCode);
52
+ }
53
+ catch (error) {
54
+ console.error(`Error converting Debats dataset:`, error);
55
+ }
56
+ }
57
+ if (enabledDatasets & EnabledDatasets.DosLeg) {
58
+ try {
59
+ await convertDatasetDosLeg(dataDir, options);
60
+ const doslegDir = path.join(dataDir, datasets.dosleg.database);
61
+ exitCode = commitGit(doslegDir, options, exitCode);
62
+ }
63
+ catch (error) {
64
+ console.error(`Error converting DosLeg dataset:`, error);
65
+ }
66
+ try {
67
+ await convertDatasetScrutins(dataDir, options);
68
+ const scrutinsDir = path.join(dataDir, SCRUTINS_FOLDER);
69
+ exitCode = commitGit(scrutinsDir, options, exitCode);
70
+ }
71
+ catch (error) {
72
+ console.error(`Error converting Scrutins dataset:`, error);
73
+ }
74
+ }
75
+ if (enabledDatasets & EnabledDatasets.Questions) {
76
+ try {
77
+ await convertDatasetQuestions(dataDir, options);
78
+ const questionsDir = path.join(dataDir, datasets.questions.database);
79
+ exitCode = commitGit(questionsDir, options, exitCode);
80
+ }
81
+ catch (error) {
82
+ console.error(`Error converting Questions dataset:`, error);
83
+ }
84
+ }
85
+ if (enabledDatasets & EnabledDatasets.Sens) {
86
+ try {
87
+ await convertDatasetSens(dataDir, options);
88
+ const sensDir = path.join(dataDir, datasets.sens.database);
89
+ exitCode = commitGit(sensDir, options, exitCode);
90
+ }
91
+ catch (error) {
92
+ console.error(`Error converting Sens dataset:`, error);
93
+ }
94
+ }
95
+ if (!options["silent"]) {
96
+ console.timeEnd("data transformation time");
97
+ }
98
+ return exitCode;
99
+ }
100
+ async function convertDatasetAmeli(dataDir, options) {
101
+ const dataset = datasets.ameli;
102
+ if (!options["silent"]) {
103
+ console.log(`Converting database ${dataset.database} data into files…`);
104
+ }
105
+ const ameliReorganizedRootDir = path.join(dataDir, dataset.database);
106
+ if (!options.keepDir) {
107
+ ensureAndClearDir(ameliReorganizedRootDir);
108
+ }
109
+ for await (const amendement of findAllAmendements(options["fromSession"])) {
110
+ if (options["verbose"]) {
111
+ console.log(`Converting ${amendement["numero"]} file…`);
112
+ }
113
+ const session = String(amendement["session"]) || UNDEFINED_SESSION;
114
+ const signetDossierLegislatif = amendement["signet_dossier_legislatif"] ||
115
+ `${amendement["nature_texte"]}-${amendement["numero_texte"]}`.toLowerCase();
116
+ const amendementFileName = `${amendement["numero"]}.json`;
117
+ const filePath = path.join(ameliReorganizedRootDir, String(session), signetDossierLegislatif, amendementFileName);
118
+ await fs.outputJSON(filePath, amendement, { spaces: 2 });
119
+ }
120
+ }
121
+ async function convertDatasetDebats(dataDir, options) {
122
+ const dataset = datasets.debats;
123
+ if (!options["silent"]) {
124
+ console.log(`Converting database ${dataset.database} data into files…`);
125
+ }
126
+ const debatsReorganizedRootDir = path.join(dataDir, dataset.database);
127
+ if (!options.keepDir) {
128
+ ensureAndClearDir(debatsReorganizedRootDir);
129
+ }
130
+ for await (const debat of findAllDebats()) {
131
+ if (options["verbose"]) {
132
+ console.log(`Converting ${debat.id} file…`);
133
+ }
134
+ const session = getSessionFromDate(debat.date_seance);
135
+ if (options["fromSession"] && session < options["fromSession"]) {
136
+ continue;
137
+ }
138
+ const debatFileName = `${debat.id}.json`;
139
+ const filePath = path.join(debatsReorganizedRootDir, String(session), debatFileName);
140
+ await fs.outputJSON(filePath, debat, { spaces: 2 });
141
+ }
142
+ }
143
+ async function convertDatasetDosLeg(dataDir, options) {
144
+ const dataset = datasets.dosleg;
145
+ if (!options["silent"]) {
146
+ console.log(`Converting database ${dataset.database} data into files…`);
147
+ }
148
+ const doslegReorganizedRootDir = path.join(dataDir, dataset.database);
149
+ const dossiersReorganizedDir = path.join(doslegReorganizedRootDir, DOSLEG_DOSSIERS_FOLDER);
150
+ if (!options.keepDir) {
151
+ ensureAndClearDir(doslegReorganizedRootDir);
152
+ ensureAndClearDir(dossiersReorganizedDir);
153
+ }
154
+ for await (const dossier of findAllDossiers()) {
155
+ if (options["verbose"]) {
156
+ console.log(`Converting ${dossier["signet"]} file…`);
157
+ }
158
+ let dossierReorganizedDir = path.join(dossiersReorganizedDir, String(UNDEFINED_SESSION));
159
+ const session = getSessionFromSignet(dossier["signet"]) || UNDEFINED_SESSION;
160
+ if (options["fromSession"] && session < options["fromSession"]) {
161
+ continue;
162
+ }
163
+ dossierReorganizedDir = path.join(dossiersReorganizedDir, String(session));
164
+ const actesBrutsNormalises = buildActesLegislatifs(dossier);
165
+ const dossierWithActes = {
166
+ ...dossier,
167
+ actes_legislatifs: actesBrutsNormalises
168
+ };
169
+ const dossierFile = `${dossier["signet"]}.json`;
170
+ await fs.outputJSON(path.join(dossierReorganizedDir, dossierFile), dossierWithActes, { spaces: 2 });
171
+ }
172
+ await convertTextes(dataDir, options);
173
+ await convertRapports(dataDir, options);
174
+ }
175
+ async function convertDatasetScrutins(dataDir, options) {
176
+ const dataset = datasets.dosleg;
177
+ if (!options["silent"]) {
178
+ console.log(`Converting database scrutins (${dataset.database}) data into files…`);
179
+ }
180
+ const scrutinsReorganizedDir = path.join(dataDir, SCRUTINS_FOLDER);
181
+ if (!options.keepDir) {
182
+ ensureAndClearDir(scrutinsReorganizedDir);
183
+ }
184
+ for await (const scrutin of findAllScrutins(options["fromSession"])) {
185
+ if (options["verbose"]) {
186
+ console.log(`Converting ${scrutin["numero"]} file…`);
187
+ }
188
+ let scrutinReorganizedDir = path.join(scrutinsReorganizedDir, String(UNDEFINED_SESSION));
189
+ const session = scrutin["session"] || UNDEFINED_SESSION;
190
+ scrutinReorganizedDir = path.join(scrutinsReorganizedDir, String(session));
191
+ const scrutinFileName = `${scrutin["numero"]}.json`;
192
+ await fs.outputJSON(path.join(scrutinReorganizedDir, scrutinFileName), scrutin, {
193
+ spaces: 2,
194
+ });
195
+ }
196
+ }
197
+ async function convertDatasetQuestions(dataDir, options) {
198
+ const dataset = datasets.questions;
199
+ if (!options["silent"]) {
200
+ console.log(`Converting database ${dataset.database} data into files…`);
201
+ }
202
+ const questionsReorganizedRootDir = path.join(dataDir, dataset.database);
203
+ if (!options.keepDir) {
204
+ ensureAndClearDir(questionsReorganizedRootDir);
205
+ }
206
+ const limit = pLimit(10);
207
+ const tasks = [];
208
+ for await (const question of findAllQuestions()) {
209
+ tasks.push(limit(async () => {
210
+ if (options["verbose"]) {
211
+ console.log(`Converting ${question["reference"]} file…`);
212
+ }
213
+ const legislature = question["legislature"] ? question["legislature"] : 0;
214
+ const questionFileName = `${question["reference"]}.json`;
215
+ await fs.outputJSON(path.join(questionsReorganizedRootDir, String(legislature), questionFileName), question, {
216
+ spaces: 2,
217
+ });
218
+ }));
219
+ }
220
+ await Promise.all(tasks);
221
+ }
222
+ async function convertTextes(dataDir, options) {
223
+ const originalTextesDir = path.join(dataDir, TEXTE_FOLDER, DATA_ORIGINAL_FOLDER);
224
+ const transformedTextesDir = path.join(dataDir, TEXTE_FOLDER, DATA_TRANSFORMED_FOLDER);
225
+ if (!options["silent"]) {
226
+ console.log(`Converting database textes data into files…`);
227
+ }
228
+ for await (const texte of findAllTextes()) {
229
+ const session = texte["session"] ?? UNDEFINED_SESSION;
230
+ if (options["fromSession"] && session < options["fromSession"]) {
231
+ continue;
232
+ }
233
+ if (!texte["url"]) {
234
+ continue;
235
+ }
236
+ const texteName = path.parse(texte["url"]).name;
237
+ const texteDir = path.join(originalTextesDir, `${session}`, texteName);
238
+ // oritxtcod = 1 corresponds to "Texte de loi déposé au Sénat"
239
+ const hasExposeDesMotifs = texte["origine"] === 'Sénat' && texte["ordre_origine"] === '1';
240
+ const metadata = {
241
+ name: texteName,
242
+ session: texte["session"],
243
+ date: texte["date"],
244
+ url_expose_des_motifs: hasExposeDesMotifs
245
+ ? new URL(`${texteName}-expose.html`, SENAT_EXPOSE_DES_MOTIFS_BASE_URL)
246
+ : undefined,
247
+ url_xml: new URL(`${texteName}.akn.xml`, SENAT_TEXTE_XML_BASE_URL),
248
+ url_html: new URL(`${texteName}.html`, SENAT_TEXTE_BASE_URL),
249
+ url_pdf: new URL(`${texteName}.pdf`, SENAT_TEXTE_BASE_URL),
250
+ };
251
+ fs.outputJSONSync(path.join(texteDir, `${texteName}.json`), texte, {
252
+ spaces: 2,
253
+ });
254
+ fs.outputJSONSync(path.join(texteDir, DOCUMENT_METADATA_FILE), metadata, {
255
+ spaces: 2,
256
+ });
257
+ if (options.fetchDocuments) {
258
+ await processTexte(metadata, originalTextesDir, transformedTextesDir, options);
259
+ }
260
+ }
261
+ }
262
+ async function convertRapports(dataDir, options) {
263
+ const originalRapportsDir = path.join(dataDir, RAPPORT_FOLDER, DATA_ORIGINAL_FOLDER);
264
+ if (!options["silent"]) {
265
+ console.log(`Converting database rapports data into files…`);
266
+ }
267
+ for await (const rapport of findAllRapports()) {
268
+ const session = rapport["session"] ?? UNDEFINED_SESSION;
269
+ if (options["fromSession"] && session < options["fromSession"]) {
270
+ continue;
271
+ }
272
+ if (!rapport["url"]) {
273
+ continue;
274
+ }
275
+ const parsedRapportUrl = path.parse(rapport["url"]);
276
+ const rapportName = parsedRapportUrl.name;
277
+ const rapportDir = path.join(originalRapportsDir, `${session}`, rapportName);
278
+ const rapportHtmlUrlBase = `${rapportName}_mono.html`;
279
+ const rapportHtmlUrl = path.format({
280
+ dir: parsedRapportUrl.dir,
281
+ base: rapportHtmlUrlBase,
282
+ });
283
+ const rapportPdfUrlBase = `${rapportName}1.pdf`;
284
+ const rapportPdfUrl = path.format({
285
+ dir: parsedRapportUrl.dir,
286
+ base: rapportPdfUrlBase,
287
+ });
288
+ const metadata = {
289
+ name: rapportName,
290
+ session: rapport["session"],
291
+ date: rapport["date"],
292
+ url_html: new URL(rapportHtmlUrl, SENAT_RAPPORT_BASE_URL),
293
+ url_pdf: new URL(rapportPdfUrl, SENAT_RAPPORT_BASE_URL),
294
+ };
295
+ fs.outputJSONSync(path.join(rapportDir, `${rapportName}.json`), rapport, {
296
+ spaces: 2,
297
+ });
298
+ fs.outputJSONSync(path.join(rapportDir, DOCUMENT_METADATA_FILE), metadata, {
299
+ spaces: 2,
300
+ });
301
+ if (options.fetchDocuments) {
302
+ await processRapport(metadata, originalRapportsDir, options);
303
+ }
304
+ }
305
+ }
306
+ async function convertDatasetSens(dataDir, options) {
307
+ const dataset = datasets.sens;
308
+ if (!options["silent"]) {
309
+ console.log(`Converting database ${dataset.database} data into files…`);
310
+ }
311
+ const sensReorganizedRootDir = path.join(dataDir, dataset.database);
312
+ const senateursReorganizedDir = path.join(sensReorganizedRootDir, SENS_SENATEURS_FOLDER);
313
+ const circonscriptionsReorganizedDir = path.join(sensReorganizedRootDir, SENS_CIRCONSCRIPTIONS_FOLDER);
314
+ const organismesReorganizedDir = path.join(sensReorganizedRootDir, SENS_ORGANISMES_FOLDER);
315
+ if (!options.keepDir) {
316
+ ensureAndClearDir(sensReorganizedRootDir);
317
+ ensureAndClearDir(senateursReorganizedDir);
318
+ ensureAndClearDir(circonscriptionsReorganizedDir);
319
+ ensureAndClearDir(organismesReorganizedDir);
320
+ }
321
+ for await (const sen of findAllSens()) {
322
+ if (options["verbose"]) {
323
+ console.log(`Converting ${sen["matricule"]} file…`);
324
+ }
325
+ const senFileName = `${sen["matricule"]}.json`;
326
+ fs.outputJSONSync(path.join(senateursReorganizedDir, senFileName), sen, {
327
+ spaces: 2,
328
+ });
329
+ }
330
+ for await (const circonscription of findAllCirconscriptions()) {
331
+ if (options["verbose"]) {
332
+ console.log(`Converting ${circonscription["identifiant"]} file…`);
333
+ }
334
+ const circonscriptionFileName = `${circonscription["identifiant"]}.json`;
335
+ fs.outputJSONSync(path.join(circonscriptionsReorganizedDir, circonscriptionFileName), circonscription, {
336
+ spaces: 2,
337
+ });
338
+ }
339
+ for await (const organisme of findAllOrganismes()) {
340
+ if (options["verbose"]) {
341
+ console.log(`Converting ${organisme["code"]} file…`);
342
+ }
343
+ const organismeFileName = `${organisme["code"]}.json`;
344
+ fs.outputJSONSync(path.join(organismesReorganizedDir, organisme["type_code"], organismeFileName), organisme, {
345
+ spaces: 2,
346
+ });
347
+ }
348
+ }
349
+ convertData()
350
+ .then((exitCode) => process.exit(exitCode || 0))
351
+ .catch((error) => {
352
+ console.log(error);
353
+ process.exit(1);
354
+ });
@@ -0,0 +1,181 @@
1
+ import assert from "assert";
2
+ import commandLineArgs from "command-line-args";
3
+ import fs from "fs-extra";
4
+ import path from "path";
5
+ import { datasets, EnabledDatasets, getEnabledDatasets } from "../datasets";
6
+ import { DOCUMENT_METADATA_FILE, DOSLEG_DOSSIERS_FOLDER, RAPPORT_FOLDER, SENS_CIRCONSCRIPTIONS_FOLDER, SENS_ORGANISMES_FOLDER, SENS_SENATEURS_FOLDER, TEXTE_FOLDER, TEXTE_ORIGINAL_FOLDER, } from "../loaders";
7
+ import { findAllAmendements, findAllCirconscriptions, findAllLois, findAllOrganismes, findAllQuestions, findAllSens, } from "../model";
8
+ import { findSenatRapportUrls, findSenatTexteUrls } from "../model/dosleg";
9
+ import { formatToFourDigitSession, SIGNET_STRUCTURE_REGEXP, UNDEFINED_SESSION } from "./datautil";
10
+ import { commonOptions } from "./shared/cli_helpers";
11
+ import { ensureAndClearDir } from "./shared/util";
12
+ const optionsDefinitions = [
13
+ ...commonOptions,
14
+ ];
15
+ const options = commandLineArgs(optionsDefinitions);
16
+ const SENAT_TEXTE_XML_BASE_URL = "https://www.senat.fr/akomantoso/";
17
+ const SENAT_TEXTE_BASE_URL = "https://www.senat.fr/leg/";
18
+ const SENAT_EXPOSE_DES_MOTIFS_BASE_URL = "https://www.senat.fr/leg/exposes-des-motifs/";
19
+ const SENAT_RAPPORT_BASE_URL = "https://www.senat.fr/rap/";
20
+ async function convertData() {
21
+ const enabledDatasets = getEnabledDatasets(options.categories);
22
+ const dataDir = options.dataDir;
23
+ assert(dataDir, "Missing argument: data directory");
24
+ console.time("data transformation time");
25
+ if (enabledDatasets & EnabledDatasets.Ameli) {
26
+ const dataset = datasets.ameli;
27
+ if (!options.silent) {
28
+ console.log(`Converting database ${dataset.database} data into files…`);
29
+ }
30
+ const ameliReorganizedRootDir = path.join(dataDir, dataset.database);
31
+ ensureAndClearDir(ameliReorganizedRootDir);
32
+ for await (const amendement of findAllAmendements()) {
33
+ if (options.verbose) {
34
+ console.log(`Converting ${amendement.numero} file…`);
35
+ }
36
+ const session = String(amendement.session) || UNDEFINED_SESSION;
37
+ const signetDossierLegislatif = amendement.signet_dossier_legislatif
38
+ || `${amendement.nature_texte}-${amendement.numero_texte}`.toLowerCase();
39
+ const ameliReorganizedDir = path.join(ameliReorganizedRootDir, session, signetDossierLegislatif);
40
+ fs.ensureDirSync(ameliReorganizedDir);
41
+ const amendementFileName = `${amendement.numero}.json`;
42
+ fs.writeJSONSync(path.join(ameliReorganizedDir, amendementFileName), amendement, { spaces: 2 });
43
+ }
44
+ }
45
+ if (enabledDatasets & EnabledDatasets.DosLeg) {
46
+ const dataset = datasets.dosleg;
47
+ if (!options.silent) {
48
+ console.log(`Converting database ${dataset.database} data into files…`);
49
+ }
50
+ const doslegReorganizedRootDir = path.join(dataDir, dataset.database);
51
+ const dossiersReorganizedDir = path.join(doslegReorganizedRootDir, DOSLEG_DOSSIERS_FOLDER);
52
+ ensureAndClearDir(doslegReorganizedRootDir);
53
+ ensureAndClearDir(dossiersReorganizedDir);
54
+ for await (const loi of findAllLois()) {
55
+ if (options.verbose) {
56
+ console.log(`Converting ${loi.signet} file…`);
57
+ }
58
+ let loiReorganizedDir = path.join(dossiersReorganizedDir, UNDEFINED_SESSION);
59
+ const signetParts = SIGNET_STRUCTURE_REGEXP.exec(loi.signet)?.groups;
60
+ if (signetParts) {
61
+ const { session } = signetParts;
62
+ const formattedSession = formatToFourDigitSession(session);
63
+ loiReorganizedDir = path.join(dossiersReorganizedDir, formattedSession);
64
+ }
65
+ fs.ensureDirSync(loiReorganizedDir);
66
+ const loiFileName = `${loi.signet}.json`;
67
+ fs.writeJSONSync(path.join(loiReorganizedDir, loiFileName), loi, { spaces: 2 });
68
+ }
69
+ await convertTexteUrls(dataDir);
70
+ await convertRapportUrls(dataDir);
71
+ }
72
+ if (enabledDatasets & EnabledDatasets.Questions) {
73
+ const dataset = datasets.questions;
74
+ if (!options.silent) {
75
+ console.log(`Converting database ${dataset.database} data into files…`);
76
+ }
77
+ const questionsReorganizedRootDir = path.join(dataDir, dataset.database);
78
+ ensureAndClearDir(questionsReorganizedRootDir);
79
+ for await (const question of findAllQuestions()) {
80
+ if (options.verbose) {
81
+ console.log(`Converting ${question.reference} file…`);
82
+ }
83
+ const legislature = question.legislature ? question.legislature : 0;
84
+ const questionReorganizedDir = path.join(questionsReorganizedRootDir, String(legislature));
85
+ fs.ensureDirSync(questionReorganizedDir);
86
+ const questionFileName = `${question.reference}.json`;
87
+ fs.writeJSONSync(path.join(questionReorganizedDir, questionFileName), question, { spaces: 2 });
88
+ }
89
+ }
90
+ if (enabledDatasets & EnabledDatasets.Sens) {
91
+ const dataset = datasets.sens;
92
+ if (!options.silent) {
93
+ console.log(`Converting database ${dataset.database} data into files…`);
94
+ }
95
+ const sensReorganizedRootDir = path.join(dataDir, dataset.database);
96
+ const senateursReorganizedDir = path.join(sensReorganizedRootDir, SENS_SENATEURS_FOLDER);
97
+ const circonscriptionsReorganizedDir = path.join(sensReorganizedRootDir, SENS_CIRCONSCRIPTIONS_FOLDER);
98
+ const organismesReorganizedDir = path.join(sensReorganizedRootDir, SENS_ORGANISMES_FOLDER);
99
+ ensureAndClearDir(sensReorganizedRootDir);
100
+ ensureAndClearDir(senateursReorganizedDir);
101
+ ensureAndClearDir(circonscriptionsReorganizedDir);
102
+ ensureAndClearDir(organismesReorganizedDir);
103
+ for await (const sen of findAllSens()) {
104
+ if (options.verbose) {
105
+ console.log(`Converting ${sen.matricule} file…`);
106
+ }
107
+ const senFileName = `${sen.matricule}.json`;
108
+ fs.writeJSONSync(path.join(senateursReorganizedDir, senFileName), sen, { spaces: 2 });
109
+ }
110
+ for await (const circonscription of findAllCirconscriptions()) {
111
+ if (options.verbose) {
112
+ console.log(`Converting ${circonscription.identifiant} file…`);
113
+ }
114
+ const circonscriptionFileName = `${circonscription.identifiant}.json`;
115
+ fs.writeJSONSync(path.join(circonscriptionsReorganizedDir, circonscriptionFileName), circonscription, { spaces: 2 });
116
+ }
117
+ for await (const organisme of findAllOrganismes()) {
118
+ if (options.verbose) {
119
+ console.log(`Converting ${organisme.code} file…`);
120
+ }
121
+ const organismeFileName = `${organisme.code}.json`;
122
+ fs.writeJSONSync(path.join(organismesReorganizedDir, organismeFileName), organisme, { spaces: 2 });
123
+ }
124
+ }
125
+ if (!options.silent) {
126
+ console.timeEnd("data transformation time");
127
+ }
128
+ }
129
+ async function convertTexteUrls(dataDir) {
130
+ const textesDir = path.join(dataDir, TEXTE_FOLDER);
131
+ fs.ensureDirSync(textesDir);
132
+ const originalTextesDir = path.join(textesDir, TEXTE_ORIGINAL_FOLDER);
133
+ for await (const texte of findSenatTexteUrls(options.sessions)) {
134
+ const texteName = path.parse(texte.url).name;
135
+ const texteDir = path.join(originalTextesDir, `${texte.session ?? UNDEFINED_SESSION}`, texteName);
136
+ fs.ensureDirSync(texteDir);
137
+ const metadata = {
138
+ name: texteName,
139
+ session: texte.session,
140
+ url_expose_des_motifs: texte.hasExposeDesMotifs ?
141
+ new URL(`${texteName}-expose.html`, SENAT_EXPOSE_DES_MOTIFS_BASE_URL) : undefined,
142
+ url_xml: new URL(`${texteName}.akn.xml`, SENAT_TEXTE_XML_BASE_URL),
143
+ url_html: new URL(`${texteName}.html`, SENAT_TEXTE_BASE_URL),
144
+ url_pdf: new URL(`${texteName}.pdf`, SENAT_TEXTE_BASE_URL),
145
+ };
146
+ fs.writeJSONSync(path.join(texteDir, DOCUMENT_METADATA_FILE), metadata, { spaces: 2 });
147
+ }
148
+ }
149
+ async function convertRapportUrls(dataDir) {
150
+ const rapportsDir = path.join(dataDir, RAPPORT_FOLDER);
151
+ fs.ensureDirSync(rapportsDir);
152
+ for await (const rapport of findSenatRapportUrls(options.sessions)) {
153
+ const parsedRapportUrl = path.parse(rapport.url);
154
+ const rapportName = parsedRapportUrl.name;
155
+ const rapportDir = path.join(rapportsDir, `${rapport.session ?? UNDEFINED_SESSION}`, rapportName);
156
+ fs.ensureDirSync(rapportDir);
157
+ const rapportHtmlUrlBase = `${rapportName}_mono.html`;
158
+ const rapportHtmlUrl = path.format({
159
+ dir: parsedRapportUrl.dir,
160
+ base: rapportHtmlUrlBase,
161
+ });
162
+ const rapportPdfUrlBase = `${rapportName}1.pdf`;
163
+ const rapportPdfUrl = path.format({
164
+ dir: parsedRapportUrl.dir,
165
+ base: rapportPdfUrlBase,
166
+ });
167
+ const metadata = {
168
+ name: rapportName,
169
+ session: rapport.session,
170
+ url_html: new URL(rapportHtmlUrl, SENAT_RAPPORT_BASE_URL),
171
+ url_pdf: new URL(rapportPdfUrl, SENAT_RAPPORT_BASE_URL),
172
+ };
173
+ fs.writeJSONSync(path.join(rapportDir, DOCUMENT_METADATA_FILE), metadata, { spaces: 2 });
174
+ }
175
+ }
176
+ convertData()
177
+ .then(() => process.exit(0))
178
+ .catch((error) => {
179
+ console.log(error);
180
+ process.exit(1);
181
+ });