mdbq 1.4.3__tar.gz → 1.4.5__tar.gz
This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.
- {mdbq-1.4.3 → mdbq-1.4.5}/PKG-INFO +1 -1
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/aggregation/aggregation.py +37 -11
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/aggregation/optimize_data.py +1 -1
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/clean/data_clean.py +3 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/company/copysh.py +1 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq.egg-info/PKG-INFO +1 -1
- {mdbq-1.4.3 → mdbq-1.4.5}/setup.py +1 -1
- {mdbq-1.4.3 → mdbq-1.4.5}/README.txt +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/__init__.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/__version__.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/aggregation/__init__.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/aggregation/df_types.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/aggregation/mysql_types.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/aggregation/query_data.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/bdup/__init__.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/bdup/bdup.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/clean/__init__.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/company/__init__.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/config/__init__.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/config/get_myconf.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/config/products.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/config/set_support.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/config/update_conf.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/dataframe/__init__.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/dataframe/converter.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/log/__init__.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/log/mylogger.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/mongo/__init__.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/mongo/mongo.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/mysql/__init__.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/mysql/mysql.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/mysql/s_query.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/mysql/year_month_day.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/other/__init__.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/other/porxy.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/other/pov_city.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/other/ua_sj.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/pbix/__init__.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/pbix/pbix_refresh.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/pbix/refresh_all.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq/spider/__init__.py +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq.egg-info/SOURCES.txt +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq.egg-info/dependency_links.txt +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/mdbq.egg-info/top_level.txt +0 -0
- {mdbq-1.4.3 → mdbq-1.4.5}/setup.cfg +0 -0
@@ -366,6 +366,8 @@ class DatabaseUpdate:
|
|
366
366
|
df = pd.read_csv(os.path.join(root, name), encoding='utf-8_sig', header=0, na_filter=False)
|
367
367
|
elif name.endswith('.csv') and '类目洞察_价格分析_分析明细_汇总' in name:
|
368
368
|
df = pd.read_csv(os.path.join(root, name), encoding='utf-8_sig', header=0, na_filter=False)
|
369
|
+
elif name.endswith('.csv') and '搜索排行_搜索' in name:
|
370
|
+
df = pd.read_csv(os.path.join(root, name), encoding='utf-8_sig', header=0, na_filter=False)
|
369
371
|
elif name.endswith('.csv') and '竞店分析-销售分析-关键指标对比' in name:
|
370
372
|
df = pd.read_csv(os.path.join(root, name), encoding='utf-8_sig', header=0, na_filter=False)
|
371
373
|
elif name.endswith('.csv') and '竞店分析-销售分析-top商品榜' in name:
|
@@ -592,15 +594,15 @@ class DatabaseUpdate:
|
|
592
594
|
if is_move:
|
593
595
|
os.remove(os.path.join(root, name))
|
594
596
|
|
595
|
-
df = self.date_table() # 创建一个日期表
|
596
|
-
self.datas.append(
|
597
|
-
|
598
|
-
|
599
|
-
|
600
|
-
|
601
|
-
|
602
|
-
|
603
|
-
)
|
597
|
+
# df = self.date_table() # 创建一个日期表
|
598
|
+
# self.datas.append(
|
599
|
+
# {
|
600
|
+
# '数据库名': '聚合数据',
|
601
|
+
# '集合名称': '日期表',
|
602
|
+
# '数据主体': df,
|
603
|
+
# '文件名': '日期表文件名',
|
604
|
+
# }
|
605
|
+
# )
|
604
606
|
|
605
607
|
def upload_df(self, service_databases=[{}], path=None, system_name=None):
|
606
608
|
"""
|
@@ -631,6 +633,8 @@ class DatabaseUpdate:
|
|
631
633
|
is_file_dtype=True, # 默认本地文件优先: True
|
632
634
|
)
|
633
635
|
d.df_to_mongo(df=df, db_name=db_name, collection_name=collection_name)
|
636
|
+
if d.client:
|
637
|
+
d.client.close()
|
634
638
|
|
635
639
|
elif database == 'mysql':
|
636
640
|
username, password, host, port = get_myconf.select_config_values(
|
@@ -780,7 +784,7 @@ class DatabaseUpdate:
|
|
780
784
|
encod = chardet.detect(f1).get('encoding')
|
781
785
|
return encod
|
782
786
|
|
783
|
-
def date_table(self):
|
787
|
+
def date_table(self, service_databases=[{}]):
|
784
788
|
"""
|
785
789
|
生成 pbix使用的日期表
|
786
790
|
"""
|
@@ -805,7 +809,29 @@ class DatabaseUpdate:
|
|
805
809
|
df['索引'] = p
|
806
810
|
df['月索引'] = mon
|
807
811
|
df.sort_values('日期', ascending=False, ignore_index=True, inplace=True)
|
808
|
-
|
812
|
+
|
813
|
+
for service_database in service_databases:
|
814
|
+
for service_name, database in service_database.items():
|
815
|
+
username, password, host, port = get_myconf.select_config_values(
|
816
|
+
target_service=service_name,
|
817
|
+
database=database,
|
818
|
+
)
|
819
|
+
m = mysql.MysqlUpload(
|
820
|
+
username=username,
|
821
|
+
password=password,
|
822
|
+
host=host,
|
823
|
+
port=port,
|
824
|
+
)
|
825
|
+
m.df_to_mysql(
|
826
|
+
df=df,
|
827
|
+
db_name=db_name,
|
828
|
+
table_name=collection_name,
|
829
|
+
df_sql=False, # 值为 True 时使用 df.to_sql 函数上传整个表, 不会排重
|
830
|
+
drop_dup=True, # 值为 True 时检查重复数据再插入,反之直接上传,会比较慢
|
831
|
+
filename=None, # 用来追踪处理进度
|
832
|
+
system_name=service_name, # 用来追踪处理进度
|
833
|
+
)
|
834
|
+
# return df
|
809
835
|
|
810
836
|
|
811
837
|
def upload_dir(path, db_name, collection_name, dbs={'mysql': True, 'mongodb': True}, json_path=None, system_name=None):
|
@@ -1046,6 +1046,9 @@ class DataClean:
|
|
1046
1046
|
elif name.endswith('.csv') and '类目洞察' in name and '价格分析_分析明细_商品发现' in name:
|
1047
1047
|
t_path = str(pathlib.Path(self.source_path, '市场数据/类目洞察/价格分析/商品发现'))
|
1048
1048
|
bib(t_path, _as_month=True)
|
1049
|
+
elif name.endswith('.csv') and '搜索排行_搜索' in name:
|
1050
|
+
t_path = str(pathlib.Path(self.source_path, '市场数据/搜索排行'))
|
1051
|
+
bib(t_path, _as_month=True)
|
1049
1052
|
elif name.endswith('.csv') and '市场排行_店铺排行' in name:
|
1050
1053
|
t_path = str(pathlib.Path(self.source_path, '市场数据/市场二级类目店铺'))
|
1051
1054
|
bib(t_path, _as_month=True)
|
@@ -347,6 +347,7 @@ def main():
|
|
347
347
|
dp.new_unzip(is_move=True)
|
348
348
|
dp.cleaning(is_move=True) # 公司台式机需要移除自身下载的文件
|
349
349
|
dp.upload_df(service_databases=[{'company': 'mysql'}], system_name='company')
|
350
|
+
dp.date_table(service_databases=[{'company': 'mysql'}]) # 因为日期表不受 days 参数控制,因此单独更新日期表
|
350
351
|
|
351
352
|
# 此操作用于修改 .copysh_conf 文件,将 ch_record 改为 false (更新完成)
|
352
353
|
w = update_conf.UpdateConf()
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|