datamule 2.1.0__tar.gz → 2.1.2__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {datamule-2.1.0 → datamule-2.1.2}/PKG-INFO +1 -1
- {datamule-2.1.0 → datamule-2.1.2}/datamule/datamule/datamule_mysql_rds.py +3 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/datamule/downloader.py +5 -1
- {datamule-2.1.0 → datamule-2.1.2}/datamule/document/document.py +2 -2
- {datamule-2.1.0 → datamule-2.1.2}/datamule/mapping_dicts/html_mapping_dicts.py +2 -2
- {datamule-2.1.0 → datamule-2.1.2}/datamule/submission.py +6 -6
- {datamule-2.1.0 → datamule-2.1.2}/datamule.egg-info/PKG-INFO +1 -1
- {datamule-2.1.0 → datamule-2.1.2}/setup.py +1 -1
- {datamule-2.1.0 → datamule-2.1.2}/datamule/__init__.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/config.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/data/listed_filer_metadata.csv +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/datamule/__init__.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/datamule/datamule_lookup.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/datamule/sec_connector.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/document/__init__.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/document/tables/__init__.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/document/tables/tables.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/document/tables/tables_13fhr.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/document/tables/tables_25nse.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/document/tables/tables_informationtable.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/document/tables/tables_npx.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/document/tables/tables_ownership.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/document/tables/tables_proxyvotingrecord.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/document/tables/tables_sbsef.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/document/tables/tables_sdr.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/document/tables/utils.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/helper.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/index.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/mapping_dicts/__init__.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/mapping_dicts/txt_mapping_dicts.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/mapping_dicts/xml_mapping_dicts.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/package_updater.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/portfolio.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/portfolio_compression_utils.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/sec/__init__.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/sec/infrastructure/__init__.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/sec/infrastructure/submissions_metadata.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/sec/submissions/__init__.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/sec/submissions/downloader.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/sec/submissions/eftsquery.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/sec/submissions/monitor.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/sec/submissions/streamer.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/sec/submissions/textsearch.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/sec/utils.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/sec/xbrl/__init__.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/sec/xbrl/downloadcompanyfacts.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/sec/xbrl/filter_xbrl.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/sec/xbrl/streamcompanyfacts.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/sec/xbrl/xbrlmonitor.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/seclibrary/__init__.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/seclibrary/bq.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/sheet.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/utils/__init__.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/utils/construct_submissions_data.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule/utils/format_accession.py +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule.egg-info/SOURCES.txt +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule.egg-info/dependency_links.txt +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule.egg-info/requires.txt +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/datamule.egg-info/top_level.txt +0 -0
- {datamule-2.1.0 → datamule-2.1.2}/setup.cfg +0 -0
@@ -71,6 +71,9 @@ class DatamuleMySQL:
|
|
71
71
|
database = 'npx_db'
|
72
72
|
elif table == 'information_table':
|
73
73
|
database = '13fhr_db'
|
74
|
+
elif table in ['derivative_holding_ownership','derivative_transaction_ownership', 'metadata_ownership','non_derivative_holding_ownership',
|
75
|
+
'non_derivative_transaction_ownership','owner_signature_ownership','reporting_owner_ownership']:
|
76
|
+
database = 'ownership_db'
|
74
77
|
else:
|
75
78
|
raise ValueError(f"Unsupported table: {table}")
|
76
79
|
|
@@ -23,7 +23,11 @@ from ..utils.format_accession import format_accession
|
|
23
23
|
# could be cleaned up
|
24
24
|
|
25
25
|
# Set up logging
|
26
|
-
logging.basicConfig(
|
26
|
+
logging.basicConfig(
|
27
|
+
level=logging.INFO,
|
28
|
+
format='%(asctime)s - %(levelname)s - %(message)s',
|
29
|
+
handlers=logging.getLogger().handlers,
|
30
|
+
)
|
27
31
|
logger = logging.getLogger(__name__)
|
28
32
|
|
29
33
|
|
@@ -315,11 +315,11 @@ class Document:
|
|
315
315
|
else:
|
316
316
|
visualize_dict(self.data)
|
317
317
|
|
318
|
-
def get_section(self, title, format='dict'):
|
318
|
+
def get_section(self, title=None, title_regex=None,title_class=None, format='dict'):
|
319
319
|
if not self.data:
|
320
320
|
self.parse()
|
321
321
|
|
322
|
-
result = get_title(self.data,title)
|
322
|
+
result = get_title(self.data,title=title,title_regex=title_regex,title_class=title_class)
|
323
323
|
|
324
324
|
if format == 'text':
|
325
325
|
result = [item[1] for item in result]
|
@@ -1,7 +1,7 @@
|
|
1
1
|
dict_10k_html = {
|
2
2
|
('part',r'^part\s*([ivx]+)$') : 0,
|
3
3
|
('signatures',r'^signatures?\.*$') : 0,
|
4
|
-
('item',r'^item\s*(\d+)\.?([a-z])?') : 1,
|
4
|
+
('item',r'^item\s*(\d+)\.?([a-z])?(?![a-z])') : 1,
|
5
5
|
}
|
6
6
|
dict_10q_html = dict_10k_html
|
7
7
|
|
@@ -48,7 +48,7 @@ dict_10d_html = dict_10k_html
|
|
48
48
|
|
49
49
|
dict_20f_html = {
|
50
50
|
('part',r'^part\s*([ivx]+)') : 0,
|
51
|
-
('item',r'^item\s*(\d+)\.?([a-z])?') : 1,
|
51
|
+
('item',r'^item\s*(\d+)\.?([a-z])?(?![a-z])') : 1,
|
52
52
|
('letter',r'\d*\.?([a-z])') : 2,
|
53
53
|
('signatures',r'^signatures?\.*$') : 0,
|
54
54
|
}
|
@@ -163,8 +163,8 @@ class Submission:
|
|
163
163
|
content = zstd.ZstdDecompressor().decompress(content)
|
164
164
|
|
165
165
|
# Decode text files
|
166
|
-
if extension in ['.htm', '.html', '.txt', '.xml']:
|
167
|
-
|
166
|
+
# if extension in ['.htm', '.html', '.txt', '.xml']:
|
167
|
+
# content = content.decode('utf-8', errors='replace')
|
168
168
|
|
169
169
|
document_path = f"{self.batch_tar_path}::{self.accession_prefix}/{filename}"
|
170
170
|
|
@@ -197,8 +197,8 @@ class Submission:
|
|
197
197
|
content = zstd.ZstdDecompressor().decompress(content)
|
198
198
|
|
199
199
|
# Decode text files
|
200
|
-
if extension in ['.htm', '.html', '.txt', '.xml']:
|
201
|
-
|
200
|
+
# if extension in ['.htm', '.html', '.txt', '.xml']:
|
201
|
+
# content = content.decode('utf-8', errors='replace')
|
202
202
|
|
203
203
|
document_path = f"{self.path}::{actual_filename}"
|
204
204
|
|
@@ -219,8 +219,8 @@ class Submission:
|
|
219
219
|
content = zstd.ZstdDecompressor().decompress(content)
|
220
220
|
|
221
221
|
# Decode text files
|
222
|
-
if extension in ['.htm', '.html', '.txt', '.xml']:
|
223
|
-
|
222
|
+
# if extension in ['.htm', '.html', '.txt', '.xml']:
|
223
|
+
# content = content.decode('utf-8', errors='replace')
|
224
224
|
|
225
225
|
return Document(
|
226
226
|
type=doc['type'],
|
@@ -32,7 +32,7 @@ if not os.path.exists(file_path):
|
|
32
32
|
setup(
|
33
33
|
name="datamule",
|
34
34
|
author="John Friedman",
|
35
|
-
version="2.1.0",
|
35
|
+
version="2.1.2",
|
36
36
|
description="Work with SEC submissions at scale.",
|
37
37
|
packages=find_packages(include=['datamule', 'datamule.*']),
|
38
38
|
url="https://github.com/john-friedman/datamule-python",
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|