datamule 1.4.0__tar.gz → 1.4.2__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {datamule-1.4.0 → datamule-1.4.2}/PKG-INFO +1 -1
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/document.py +4 -3
- {datamule-1.4.0 → datamule-1.4.2}/datamule.egg-info/PKG-INFO +1 -1
- {datamule-1.4.0 → datamule-1.4.2}/setup.py +1 -1
- {datamule-1.4.0 → datamule-1.4.2}/datamule/__init__.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/config.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/data/listed_filer_metadata.csv +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/__init__.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/__init__.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/atsn.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/cfportal.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/d.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/ex102_abs.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/ex99a_sdr.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/ex99c_sdr.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/ex99g_sdr.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/ex99i_sdr.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/information_table.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/nmfp.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/npx.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/onefourtyfour.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/ownership.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/proxy_voting_record.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/sbs.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/sbsef.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/schedule13.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/sdr.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/submission_metadata.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/ta.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/thirteenfhr.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/twentyfivense.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/mappings/twentyfourf2nt.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/processing.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/document/table.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/helper.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/index.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/mapping_dicts/__init__.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/mapping_dicts/html_mapping_dicts.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/mapping_dicts/txt_mapping_dicts.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/mapping_dicts/xml_mapping_dicts.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/package_updater.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/portfolio.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/sec/__init__.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/sec/infrastructure/__init__.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/sec/infrastructure/submissions_metadata.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/sec/submissions/__init__.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/sec/submissions/downloader.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/sec/submissions/eftsquery.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/sec/submissions/monitor.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/sec/submissions/streamer.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/sec/submissions/textsearch.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/sec/utils.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/sec/xbrl/__init__.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/sec/xbrl/downloadcompanyfacts.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/sec/xbrl/filter_xbrl.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/sec/xbrl/streamcompanyfacts.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/sec/xbrl/xbrlmonitor.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/seclibrary/__init__.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/seclibrary/bq.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/seclibrary/downloader.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/seclibrary/query.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/sheet.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule/submission.py +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule.egg-info/SOURCES.txt +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule.egg-info/dependency_links.txt +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule.egg-info/requires.txt +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/datamule.egg-info/top_level.txt +0 -0
- {datamule-1.4.0 → datamule-1.4.2}/setup.cfg +0 -0
@@ -3,7 +3,7 @@ import csv
|
|
3
3
|
import re
|
4
4
|
from doc2dict import xml2dict, txt2dict, dict2dict
|
5
5
|
from doc2dict.mapping import flatten_hierarchy
|
6
|
-
from doc2dict import html2dict, visualize_dict, get_title, unnest_dict
|
6
|
+
from doc2dict import html2dict, visualize_dict, get_title, unnest_dict, pdf2dict
|
7
7
|
from ..mapping_dicts.txt_mapping_dicts import dict_10k, dict_10q, dict_8k, dict_13d, dict_13g
|
8
8
|
from ..mapping_dicts.xml_mapping_dicts import dict_345
|
9
9
|
from ..mapping_dicts.html_mapping_dicts import dict_10k_html, dict_10q_html, dict_8k_html
|
@@ -134,6 +134,8 @@ class Document:
|
|
134
134
|
mapping_dict = dict_345
|
135
135
|
|
136
136
|
self.data = xml2dict(content=self.content, mapping_dict=mapping_dict)
|
137
|
+
elif self.extension == '.pdf':
|
138
|
+
self.data = pdf2dict(content=self.content, mapping_dict=mapping_dict)
|
137
139
|
else:
|
138
140
|
pass
|
139
141
|
|
@@ -235,8 +237,7 @@ class Document:
|
|
235
237
|
return result
|
236
238
|
|
237
239
|
|
238
|
-
#
|
239
|
-
# candidate for deletion
|
240
|
+
# TODO CHANGE THIS
|
240
241
|
def __iter__(self):
|
241
242
|
self.parse()
|
242
243
|
|
@@ -32,7 +32,7 @@ if not os.path.exists(file_path):
|
|
32
32
|
setup(
|
33
33
|
name="datamule",
|
34
34
|
author="John Friedman",
|
35
|
-
version="1.4.0",
|
35
|
+
version="1.4.2",
|
36
36
|
description="Work with SEC submissions at scale.",
|
37
37
|
packages=find_packages(include=['datamule', 'datamule.*']),
|
38
38
|
url="https://github.com/john-friedman/datamule-python",
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|