orbitkit 0.8.42__tar.gz → 0.8.44__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {orbitkit-0.8.42/orbitkit.egg-info → orbitkit-0.8.44}/PKG-INFO +1 -1
- orbitkit-0.8.44/orbitkit/VERSION +1 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/airflow_handler/file_flow_entry_process.py +4 -5
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/airflow_handler/file_flow_exit_process.py +3 -2
- {orbitkit-0.8.42 → orbitkit-0.8.44/orbitkit.egg-info}/PKG-INFO +1 -1
- orbitkit-0.8.42/orbitkit/VERSION +0 -1
- {orbitkit-0.8.42 → orbitkit-0.8.44}/LICENSE +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/MANIFEST.in +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/README.md +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/__init__.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/airflow_handler/__init__.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/airflow_handler/data_preprocessing.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/airflow_handler/file_handler.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/airflow_handler/file_handler_v2.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/audio_transcoder/__init__.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/audio_transcoder/netmind_extract_v1.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/constant/__init__.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/constant/report_schema.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/id_srv/__init__.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/id_srv/id_gen.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/id_srv/id_perm_like.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/lark_send/__init__.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/lark_send/lark.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/llm_tools/__init__.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/llm_tools/quick_rag_chat.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/orbit_type/__init__.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/orbit_type/doc_4_compile_rule.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/orbit_type/orbit_type_simple.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/orbit_type/tools.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_embedding/__init__.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_embedding/pdf_txt_embedding.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_embedding/pdf_txt_embedding_v2.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_extractor/__init__.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_extractor/a_stock_extractor_v1.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_extractor/exceptions.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_extractor/pdf_block_extractor_base.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_extractor/pdf_block_extractor_v1.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_extractor/pdf_block_extractor_v2.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_extractor/pdf_extractor_azure.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_extractor/pdf_extractor_minerU_v1.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_extractor/pdf_extractor_netmind_v1.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_extractor/pdf_extractor_netmind_v2.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_extractor/pdf_extractor_netmind_v3.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_extractor/pdf_extractor_orbit.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_extractor_simple/__init__.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_extractor_simple/base.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_extractor_simple/cloud_provider.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_extractor_simple/core.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_extractor_simple/exceptions.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_extractor_simple/extractors.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_extractor_simple/utils.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_writer/__init__.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/pdf_writer/pdf_writer_simple.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/util/__init__.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/util/cache_asset_downloader.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/util/common.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/util/customize_regix_manager.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/util/secret_manager.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/util/util_aliyun.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/util/util_aliyun_oss_simple.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/util/util_aws.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/util/util_aws_s3_wrapper.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/util/util_date.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/util/util_html.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/util/util_kafka.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/util/util_md5.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/util/util_selenium.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/util/util_simple_timer.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/util/util_str.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/util/util_type_mapping.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit/util/util_url.py +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit.egg-info/SOURCES.txt +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit.egg-info/dependency_links.txt +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit.egg-info/not-zip-safe +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit.egg-info/requires.txt +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/orbitkit.egg-info/top_level.txt +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/setup.cfg +0 -0
- {orbitkit-0.8.42 → orbitkit-0.8.44}/setup.py +0 -0
|
@@ -0,0 +1 @@
|
|
|
1
|
+
0.8.44
|
|
@@ -39,7 +39,6 @@ class FilingOfficialProcessor:
|
|
|
39
39
|
(self.filing_data_collection, 'filing_data')
|
|
40
40
|
]
|
|
41
41
|
}
|
|
42
|
-
self.only_low_important_set = {'internal_seekingalpha'}
|
|
43
42
|
postgres_uri = os.environ.get('PG_URI_AIRFLOW12_USER_NEWSFEEDSITE') if not postgres_uri else postgres_uri
|
|
44
43
|
if not postgres_uri:
|
|
45
44
|
raise KeyError('postgres_uri not set.')
|
|
@@ -136,10 +135,10 @@ class FilingOfficialProcessor:
|
|
|
136
135
|
for step_info, records in file_flow_info.items():
|
|
137
136
|
for record in records:
|
|
138
137
|
if 'extends' in record and record.get('extends') is not None:
|
|
139
|
-
tickers =
|
|
138
|
+
tickers = set()
|
|
140
139
|
for i in record['extends']['perm_id_list']:
|
|
141
|
-
tickers.
|
|
142
|
-
record['extends']['tickers'] = tickers
|
|
140
|
+
tickers.update(orbit_entity_id_ticker_map.get(i, []))
|
|
141
|
+
record['extends']['tickers'] = list(tickers)
|
|
143
142
|
|
|
144
143
|
record['extends']['report_type_id_list_str'] = [self.report_type_id_name_map.get(i) for i in record['extends']['report_type_id_list_str']]
|
|
145
144
|
|
|
@@ -158,7 +157,7 @@ class FilingOfficialProcessor:
|
|
|
158
157
|
f"{len(records)}--{start_stage}-{target_stage}-{x_spider_name} status: False, message: 'File has already completed the embedding stage.' ")
|
|
159
158
|
continue
|
|
160
159
|
|
|
161
|
-
if is_important
|
|
160
|
+
if is_important:
|
|
162
161
|
logger.info(f"is_important: {is_important} - {x_spider_name}")
|
|
163
162
|
status, ids, message = self.file_handler.entry_point_urgent(records=records, start_stage=start_stage,
|
|
164
163
|
target_stage=target_stage,
|
|
@@ -28,8 +28,6 @@ class FlowUpdater:
|
|
|
28
28
|
return getattr(self, collection_name)
|
|
29
29
|
|
|
30
30
|
def _handle_convert(self, status, attachments, db_store_path_set, attachments_pdf):
|
|
31
|
-
if not attachments or not attachments_pdf:
|
|
32
|
-
raise ValueError("Missing attachments: neither 'attachments' nor 'attachments_pdf' was provided.")
|
|
33
31
|
if not status:
|
|
34
32
|
return {
|
|
35
33
|
'x_status_list.status_convert.status': 'convert_failed',
|
|
@@ -37,6 +35,9 @@ class FlowUpdater:
|
|
|
37
35
|
'x_status_list.status_convert.status_meta': 'meta_init'
|
|
38
36
|
}
|
|
39
37
|
|
|
38
|
+
if not attachments or not attachments_pdf:
|
|
39
|
+
raise ValueError("Missing attachments: neither 'attachments' nor 'attachments_pdf' was provided.")
|
|
40
|
+
|
|
40
41
|
store_path_set = set()
|
|
41
42
|
parent_id_store_path_map = {i['parent_id']: i['store_path'] for i in attachments_pdf}
|
|
42
43
|
x_attachments_pdf = []
|
orbitkit-0.8.42/orbitkit/VERSION
DELETED
|
@@ -1 +0,0 @@
|
|
|
1
|
-
0.8.42
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|