datamule 2.0.1__py3-none-any.whl → 2.0.3__py3-none-any.whl
This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
- datamule/datamule/downloader.py +3 -3
- datamule/document/document.py +1 -0
- datamule/submission.py +18 -0
- {datamule-2.0.1.dist-info → datamule-2.0.3.dist-info}/METADATA +1 -1
- {datamule-2.0.1.dist-info → datamule-2.0.3.dist-info}/RECORD +7 -7
- {datamule-2.0.1.dist-info → datamule-2.0.3.dist-info}/WHEEL +0 -0
- {datamule-2.0.1.dist-info → datamule-2.0.3.dist-info}/top_level.txt +0 -0
datamule/datamule/downloader.py
CHANGED
@@ -311,11 +311,11 @@ class Downloader:
|
|
311
311
|
columns=['accessionNumber'], distinct=True, page_size=25000, quiet=False,api_key=self.api_key)
|
312
312
|
|
313
313
|
if filtered_accession_numbers:
|
314
|
-
filtered_accession_numbers = [
|
314
|
+
filtered_accession_numbers = [format_accession(item,'int') for item in filtered_accession_numbers]
|
315
315
|
filings = [filing for filing in filings if filing['accessionNumber'] in filtered_accession_numbers]
|
316
316
|
|
317
317
|
if skip_accession_numbers:
|
318
|
-
skip_accession_numbers = [
|
318
|
+
skip_accession_numbers = [format_accession(item,'int') for item in skip_accession_numbers]
|
319
319
|
filings = [filing for filing in filings if filing['accessionNumber'] not in skip_accession_numbers]
|
320
320
|
|
321
321
|
logger.debug(f"Generating URLs for {len(filings)} filings...")
|
@@ -394,7 +394,7 @@ def download(submission_type=None, cik=None, filing_date=None, api_key=None, out
|
|
394
394
|
skip_accession_numbers=[], max_batch_size=1024*1024*1024,accession_numbers=None):
|
395
395
|
|
396
396
|
if filtered_accession_numbers:
|
397
|
-
filtered_accession_numbers = [
|
397
|
+
filtered_accession_numbers = [format_accession(x,'int') for x in filtered_accession_numbers]
|
398
398
|
elif filtered_accession_numbers == []:
|
399
399
|
raise ValueError("Applied filter resulted in empty accession numbers list")
|
400
400
|
downloader = Downloader(api_key=api_key)
|
datamule/document/document.py
CHANGED
datamule/submission.py
CHANGED
@@ -14,6 +14,10 @@ class Submission:
|
|
14
14
|
def __init__(self, path=None, sgml_content=None, keep_document_types=None,
|
15
15
|
batch_tar_path=None, accession_prefix=None, portfolio_ref=None,url=None):
|
16
16
|
|
17
|
+
|
18
|
+
# declare vars to be filled later
|
19
|
+
self.xbrl = None
|
20
|
+
|
17
21
|
# Validate parameters
|
18
22
|
param_count = sum(x is not None for x in [path, sgml_content, batch_tar_path,url])
|
19
23
|
if param_count != 1:
|
@@ -238,4 +242,18 @@ class Submission:
|
|
238
242
|
if doc['type'] in document_types:
|
239
243
|
yield self._load_document_by_index(idx)
|
240
244
|
|
245
|
+
# def parse_xbrl(self):
|
246
|
+
# for idx, doc in enumerate(self.metadata.content['documents']):
|
247
|
+
# if doc['type'] in ['EX-100.INS','EX-101.INS']:
|
248
|
+
# document = self._load_document_by_index(idx)
|
249
|
+
# break
|
241
250
|
|
251
|
+
# if doc['filename'].endswith('_htm.xml'):
|
252
|
+
# document = self._load_document_by_index(idx)
|
253
|
+
# break
|
254
|
+
|
255
|
+
# print(doc['type'])
|
256
|
+
# if not document:
|
257
|
+
# return
|
258
|
+
|
259
|
+
# self.xbrl = document.parse_xbrl()
|
@@ -6,15 +6,15 @@ datamule/package_updater.py,sha256=Z9zaa_y0Z5cknpRn8oPea3gg4kquFHfpfhduKKCZ6NU,9
|
|
6
6
|
datamule/portfolio.py,sha256=YViG1JgJ9SFhg8N3tOOhBI8oc6Pmi2vwnHeHmlkC_5U,12119
|
7
7
|
datamule/portfolio_compression_utils.py,sha256=8OPYEN5zAdV1FiTxgVN3S7cTKs99Elv74bwgoIJP4QY,12654
|
8
8
|
datamule/sheet.py,sha256=Ws_YRtpvewLVioarngVMe8cgG_sp11MP9_goGbRaiWE,23952
|
9
|
-
datamule/submission.py,sha256=
|
9
|
+
datamule/submission.py,sha256=DtLoiwRE7JJW2R0NvJNyQfwstWIlU2N9Z6yOgpnH1LU,11812
|
10
10
|
datamule/data/listed_filer_metadata.csv,sha256=dT9fQ8AC5P1-Udf_UF0ZkdXJ88jNxJb_tuhi5YYL1rc,2426827
|
11
11
|
datamule/datamule/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
12
12
|
datamule/datamule/datamule_lookup.py,sha256=e8djAg-ctSyHiKk7BjbtgugZ3p8roUjzsym5z3AihUg,9468
|
13
13
|
datamule/datamule/datamule_mysql_rds.py,sha256=Oj_xPTBKkzWsuRlb_tphjJrBW1eua1cOuxjGwJx581k,10591
|
14
|
-
datamule/datamule/downloader.py,sha256=
|
14
|
+
datamule/datamule/downloader.py,sha256=aTyVUuIwynPtHB0Z9BvCasy9Ao5wfHptNAsjN-7yDTk,18525
|
15
15
|
datamule/datamule/sec_connector.py,sha256=VwOaODpHoAWy8JIky6kLR1-orW_PB61RHw7pIGRpkow,3288
|
16
16
|
datamule/document/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
17
|
-
datamule/document/document.py,sha256=
|
17
|
+
datamule/document/document.py,sha256=8UC5QfiMDufkA7v3o76mlfftqsUjNUFWKB3j894tsKw,16795
|
18
18
|
datamule/document/processing.py,sha256=jDCEzBFDSQtq7nQxRScIsbALnFcvMPOkNkMUCa7mFxg,31921
|
19
19
|
datamule/document/table.py,sha256=73yUJKY82ap32jhLmZeTti-jQ_lyhcJGlGwyxLtgYOg,12944
|
20
20
|
datamule/document/mappings/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
@@ -65,7 +65,7 @@ datamule/seclibrary/bq.py,sha256=C8sb_rpXTvchprrFLcbRar4Qi0XWW25tnv1YsHSS5o4,180
|
|
65
65
|
datamule/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
66
66
|
datamule/utils/construct_submissions_data.py,sha256=NB_hvfxlRXPyt4Fgc-5qA8vJRItkLhBedCSTaxwW7Jg,5887
|
67
67
|
datamule/utils/format_accession.py,sha256=60RtqoNqoT9zSKVb1DeOv1gncJxzPTFMNW4SNOVmC_g,476
|
68
|
-
datamule-2.0.
|
69
|
-
datamule-2.0.
|
70
|
-
datamule-2.0.
|
71
|
-
datamule-2.0.
|
68
|
+
datamule-2.0.3.dist-info/METADATA,sha256=xILAQeqGiaZbF19rqWWRoFqBLv1to0a3RdRFKdhlu0Q,560
|
69
|
+
datamule-2.0.3.dist-info/WHEEL,sha256=oiQVh_5PnQM0E3gPdiz09WCNmwiHDMaGer_elqB3coM,92
|
70
|
+
datamule-2.0.3.dist-info/top_level.txt,sha256=iOfgmtSMFVyr7JGl_bYSTDry79JbmsG4p8zKq89ktKk,9
|
71
|
+
datamule-2.0.3.dist-info/RECORD,,
|
File without changes
|
File without changes
|