datamule 1.5.0__tar.gz → 1.5.2__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {datamule-1.5.0 → datamule-1.5.2}/PKG-INFO +1 -1
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/document.py +2 -1
- {datamule-1.5.0 → datamule-1.5.2}/datamule/mapping_dicts/html_mapping_dicts.py +35 -1
- {datamule-1.5.0 → datamule-1.5.2}/datamule/portfolio.py +2 -1
- {datamule-1.5.0 → datamule-1.5.2}/datamule.egg-info/PKG-INFO +1 -1
- {datamule-1.5.0 → datamule-1.5.2}/setup.py +1 -1
- {datamule-1.5.0 → datamule-1.5.2}/datamule/__init__.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/config.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/data/listed_filer_metadata.csv +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/__init__.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/__init__.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/atsn.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/cfportal.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/d.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/ex102_abs.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/ex99a_sdr.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/ex99c_sdr.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/ex99g_sdr.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/ex99i_sdr.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/information_table.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/nmfp.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/npx.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/onefourtyfour.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/ownership.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/proxy_voting_record.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/sbs.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/sbsef.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/schedule13.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/sdr.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/submission_metadata.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/ta.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/thirteenfhr.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/twentyfivense.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/mappings/twentyfourf2nt.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/processing.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/document/table.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/helper.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/index.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/mapping_dicts/__init__.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/mapping_dicts/txt_mapping_dicts.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/mapping_dicts/xml_mapping_dicts.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/package_updater.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/sec/__init__.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/sec/infrastructure/__init__.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/sec/infrastructure/submissions_metadata.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/sec/submissions/__init__.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/sec/submissions/downloader.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/sec/submissions/eftsquery.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/sec/submissions/monitor.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/sec/submissions/streamer.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/sec/submissions/textsearch.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/sec/utils.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/sec/xbrl/__init__.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/sec/xbrl/downloadcompanyfacts.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/sec/xbrl/filter_xbrl.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/sec/xbrl/streamcompanyfacts.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/sec/xbrl/xbrlmonitor.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/seclibrary/__init__.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/seclibrary/bq.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/seclibrary/downloader.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/seclibrary/query.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/sheet.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule/submission.py +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule.egg-info/SOURCES.txt +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule.egg-info/dependency_links.txt +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule.egg-info/requires.txt +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/datamule.egg-info/top_level.txt +0 -0
- {datamule-1.5.0 → datamule-1.5.2}/setup.cfg +0 -0
@@ -194,7 +194,8 @@ class Document:
|
|
194
194
|
|
195
195
|
elif self.type == 'SD':
|
196
196
|
mapping_dict = dict_sd_html
|
197
|
-
|
197
|
+
elif self.type == 'S-1':
|
198
|
+
mapping_dict = dict_s1_html
|
198
199
|
elif self.type == 'T-3':
|
199
200
|
mapping_dict = dict_t3_html
|
200
201
|
elif self.type in ['NT 10-K', 'NT 10-Q','NT 20-F']:
|
@@ -118,4 +118,38 @@ dict_t3_html = {('general',r'^general'):0,
|
|
118
118
|
('capital securities',r'^capital securities'):0,
|
119
119
|
('indenture securities',r'^indenture securities'):0,
|
120
120
|
('signatures',r'^signatures?\.*$') : 0,
|
121
|
-
('number',r'^(\d+)') : 1,}
|
121
|
+
('number',r'^(\d+)') : 1,}
|
122
|
+
|
123
|
+
# NOTE THAT THIS IS INCOMPLETE - feel free to update it with more sections.
|
124
|
+
# I made a basic mapping due to user requests.
|
125
|
+
dict_s1_html ={
|
126
|
+
('signatures',r'^signatures?\.*$') : 0,
|
127
|
+
('mda',r'^management.?s\s+discussion'): 0,
|
128
|
+
('risk factors', r'^risk\s+factors') : 0,
|
129
|
+
('executive compensation', r'^executive\s+compensation') : 0,
|
130
|
+
('underwriting', r'^underwriting') : 0,
|
131
|
+
('legal matters', r'^legal\s+matters') : 0,
|
132
|
+
('prospectus summary', r'^prospectus\s+summary') : 0,
|
133
|
+
('use of proceeds', r'^use\s+of\s+proceeds') : 0,
|
134
|
+
('forward looking statements', r'forward-\?\s+looking\s+statements') : 0,
|
135
|
+
('dividend policy', r'^dividend\s+policy') : 0,
|
136
|
+
('capitalization', r'^capitalization') : 0,
|
137
|
+
('business', r'^business') : 0,
|
138
|
+
('management', r'^management\s+$') : 0,
|
139
|
+
('certain relationships', r'^certain\s+relationships') : 0,
|
140
|
+
('principal stockholders', r'^principal\b.*?\bstockholders\b') : 0,
|
141
|
+
('description of capital stock', r'^description\s+of\s+capital\s+stock') : 0,
|
142
|
+
('shares eligible for future sale', r'^shares\s+eligible\s+for\s+future\s+sale') : 0,
|
143
|
+
('federal income tax considerations for non us holders', r'^material\s+u\.s\.\s+federal\s+income\s+tax\s+considerations\s+for\s+non-u\.s\.\s+holders') : 0,
|
144
|
+
('where you can find more information', r'^where\s+you\s+can\s+find\s+more\s+information') : 0,
|
145
|
+
('index to financial statements', r'^index\b.*?\bfinancial\s+statements') : 0,
|
146
|
+
('dilution', r'^dilution') : 0,
|
147
|
+
('selling security holders', r'^selling\s+security\s+holders') : 0,
|
148
|
+
('plan of distribution', r'^plan\s+of\s+distribution') : 0,
|
149
|
+
('legal proceedings', r'^legal\s+proceedings') : 0,
|
150
|
+
('selected financial data', r'^selected\s+financial\s+data') : 0,
|
151
|
+
('market risk', r'^(?:quantitative\s+and\s+qualitative\s+disclosures\s+about\s+)?market\s+risk') : 0,
|
152
|
+
('property', r'^properties?$') : 0,
|
153
|
+
('controls and procedures', r'^(?:disclosure\s+)?controls\s+and\s+procedures') : 0,
|
154
|
+
('corporate governance', r'^corporate\s+governance') : 0,
|
155
|
+
}
|
@@ -33,7 +33,8 @@ class Portfolio:
|
|
33
33
|
self.api_key = api_key
|
34
34
|
|
35
35
|
def _load_submissions(self):
|
36
|
-
folders = [f for f in self.path.iterdir() if f.is_dir()]
|
36
|
+
folders = [f for f in self.path.iterdir() if f.is_dir() or f.suffix=='.tar']
|
37
|
+
print(folders)
|
37
38
|
print(f"Loading {len(folders)} submissions")
|
38
39
|
|
39
40
|
def load_submission(folder):
|
@@ -32,7 +32,7 @@ if not os.path.exists(file_path):
|
|
32
32
|
setup(
|
33
33
|
name="datamule",
|
34
34
|
author="John Friedman",
|
35
|
-
version="1.5.0",
|
35
|
+
version="1.5.2",
|
36
36
|
description="Work with SEC submissions at scale.",
|
37
37
|
packages=find_packages(include=['datamule', 'datamule.*']),
|
38
38
|
url="https://github.com/john-friedman/datamule-python",
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|