mdbq 1.7.4__py3-none-any.whl → 1.7.6__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- mdbq/aggregation/aggregation.py +26 -8
- mdbq/aggregation/query_data.py +2 -2
- mdbq/clean/data_clean.py +24 -0
- {mdbq-1.7.4.dist-info → mdbq-1.7.6.dist-info}/METADATA +1 -1
- {mdbq-1.7.4.dist-info → mdbq-1.7.6.dist-info}/RECORD +7 -7
- {mdbq-1.7.4.dist-info → mdbq-1.7.6.dist-info}/WHEEL +1 -1
- {mdbq-1.7.4.dist-info → mdbq-1.7.6.dist-info}/top_level.txt +0 -0
mdbq/aggregation/aggregation.py
CHANGED
@@ -189,6 +189,24 @@ class DatabaseUpdate:
|
|
189
189
|
collection_name='店铺来源_日数据_旧版'
|
190
190
|
elif name.endswith('.csv') and '客户运营平台_客户列表' in name:
|
191
191
|
df = pd.read_csv(os.path.join(root, name), encoding=encoding, header=0, na_filter=False)
|
192
|
+
elif name.endswith('.xls') and '生意参谋' in name and '无线店铺三级流量来源详情' in name:
|
193
|
+
# 店铺来源,手淘搜索,关键词
|
194
|
+
pattern = re.findall(r'(\d{4}-\d{2}-\d{2})_(\d{4}-\d{2}-\d{2})', name)
|
195
|
+
df = pd.read_excel(os.path.join(root, name), header=5)
|
196
|
+
if len(df) == 0:
|
197
|
+
print(f'{name} 报表数据为空')
|
198
|
+
continue
|
199
|
+
df.replace(to_replace=[','], value='', regex=True, inplace=True)
|
200
|
+
df.insert(loc=0, column='日期', value=pattern[0][1])
|
201
|
+
df.rename(columns={
|
202
|
+
'来源名称': '关键词',
|
203
|
+
'收藏商品-支付买家数': '收藏商品_支付买家数',
|
204
|
+
'加购商品-支付买家数': '加购商品_支付买家数',
|
205
|
+
}, inplace=True)
|
206
|
+
if pattern[0][0] != pattern[0][1]:
|
207
|
+
data_lis = pattern[0][0] + '_' + pattern[0][1]
|
208
|
+
df.insert(loc=1, column='数据周期', value=data_lis)
|
209
|
+
|
192
210
|
elif name.endswith('.xls') and '生意参谋' in name and '商品_全部' in name:
|
193
211
|
# 店铺商品排行
|
194
212
|
df = pd.read_excel(os.path.join(root, name), header=4)
|
@@ -1082,12 +1100,12 @@ if __name__ == '__main__':
|
|
1082
1100
|
# database='mysql'
|
1083
1101
|
# )
|
1084
1102
|
|
1085
|
-
db_name = '推广数据2'
|
1086
|
-
table_name = '超级直播'
|
1087
|
-
upload_dir(
|
1088
|
-
|
1089
|
-
|
1090
|
-
|
1091
|
-
|
1092
|
-
)
|
1103
|
+
# db_name = '推广数据2'
|
1104
|
+
# table_name = '超级直播'
|
1105
|
+
# upload_dir(
|
1106
|
+
# path='/Users/xigua/数据中心/原始文件2/推广报表/超级直播',
|
1107
|
+
# db_name=db_name,
|
1108
|
+
# collection_name=table_name,
|
1109
|
+
# dbs={'mysql': True, 'mongodb': False},
|
1110
|
+
# )
|
1093
1111
|
|
mdbq/aggregation/query_data.py
CHANGED
@@ -1351,9 +1351,9 @@ def data_aggregation(service_databases=[{}], months=1):
|
|
1351
1351
|
df=df,
|
1352
1352
|
db_name=db_name,
|
1353
1353
|
table_name=table_name,
|
1354
|
-
df_sql=True,
|
1354
|
+
# df_sql=True,
|
1355
1355
|
drop_duplicates=False,
|
1356
|
-
|
1356
|
+
icm_update=unique_key_list,
|
1357
1357
|
service_database=service_database,
|
1358
1358
|
) # 3. 回传数据库
|
1359
1359
|
res = g.performance(bb_tg=True) # 盈亏表,依赖其他表,单独做
|
mdbq/clean/data_clean.py
CHANGED
@@ -298,6 +298,27 @@ class DataClean:
|
|
298
298
|
m.df_to_mysql(df=df, db_name='生意参谋2', tabel_name='生意参谋_店铺来源_日数据_旧版')
|
299
299
|
os.remove(os.path.join(root, name))
|
300
300
|
|
301
|
+
elif name.endswith('.xls') and '生意参谋' in name and '无线店铺三级流量来源详情' in name:
|
302
|
+
# 店铺来源,手淘搜索,关键词
|
303
|
+
pattern = re.findall(r'(\d{4}-\d{2}-\d{2})_(\d{4}-\d{2}-\d{2})', name)
|
304
|
+
df = pd.read_excel(os.path.join(root, name), header=5)
|
305
|
+
if len(df) == 0:
|
306
|
+
print(f'{name} 报表数据为空')
|
307
|
+
continue
|
308
|
+
df.replace(to_replace=[','], value='', regex=True, inplace=True)
|
309
|
+
df.insert(loc=0, column='日期', value=pattern[0][1])
|
310
|
+
df.rename(columns={
|
311
|
+
'来源名称': '关键词',
|
312
|
+
'收藏商品-支付买家数': '收藏商品_支付买家数',
|
313
|
+
'加购商品-支付买家数': '加购商品_支付买家数',
|
314
|
+
}, inplace=True)
|
315
|
+
if pattern[0][0] != pattern[0][1]:
|
316
|
+
data_lis = pattern[0][0] + '_' + pattern[0][1]
|
317
|
+
df.insert(loc=1, column='数据周期', value=data_lis)
|
318
|
+
new_name = os.path.splitext(name)[0] + '.csv'
|
319
|
+
self.save_to_csv(df, root, new_name) # mysql 可能改变 df 列名,所以在上传 mysql 前保存 csv
|
320
|
+
os.remove(os.path.join(root, name))
|
321
|
+
|
301
322
|
elif name.endswith('.xls') and '生意参谋' in name and '商品_全部' in name:
|
302
323
|
# 店铺商品排行
|
303
324
|
new_name = os.path.splitext(name)[0] + '.csv'
|
@@ -1055,6 +1076,9 @@ class DataClean:
|
|
1055
1076
|
else:
|
1056
1077
|
t_path = str(pathlib.Path(self.source_path, '生意参谋/流量来源_旧版'))
|
1057
1078
|
bib(t_path, _as_month=True)
|
1079
|
+
elif name.endswith('.csv') and '生意参谋' in name and '无线店铺三级流量来源详情' in name:
|
1080
|
+
t_path = str(pathlib.Path(self.source_path, '生意参谋/手淘搜索来源'))
|
1081
|
+
bib(t_path, _as_month=True)
|
1058
1082
|
elif name.endswith('.csv') and '商品_全部' in name:
|
1059
1083
|
t_path = str(pathlib.Path(self.source_path, '生意参谋/商品排行'))
|
1060
1084
|
bib(t_path, _as_month=True)
|
@@ -1,15 +1,15 @@
|
|
1
1
|
mdbq/__init__.py,sha256=Il5Q9ATdX8yXqVxtP_nYqUhExzxPC_qk_WXQ_4h0exg,16
|
2
2
|
mdbq/__version__.py,sha256=y9Mp_8x0BCZSHsdLT_q5tX9wZwd5QgqrSIENLrb6vXA,62
|
3
3
|
mdbq/aggregation/__init__.py,sha256=EeDqX2Aml6SPx8363J-v1lz0EcZtgwIBYyCJV6CcEDU,40
|
4
|
-
mdbq/aggregation/aggregation.py,sha256=
|
4
|
+
mdbq/aggregation/aggregation.py,sha256=d7pYUku7Wbxl0tvKKNTG7mppOjGqg0LF62OpfW8fVBk,64120
|
5
5
|
mdbq/aggregation/df_types.py,sha256=oQJS2IBU3_IO6GMgbssHuC2yCjNnbta0QPGrFOwNLnU,7591
|
6
6
|
mdbq/aggregation/mysql_types.py,sha256=DQYROALDiwjJzjhaJfIIdnsrNs11i5BORlj_v6bp67Y,11062
|
7
7
|
mdbq/aggregation/optimize_data.py,sha256=u2Kl_MFtZueXJ57ycy4H2OhXD431RctUYJYCl637uT0,4176
|
8
|
-
mdbq/aggregation/query_data.py,sha256=
|
8
|
+
mdbq/aggregation/query_data.py,sha256=WxLtzR6s6gIPe6e1hB3xycZirrN83IZ0s0PyI0t2Cls,66792
|
9
9
|
mdbq/bdup/__init__.py,sha256=AkhsGk81SkG1c8FqDH5tRq-8MZmFobVbN60DTyukYTY,28
|
10
10
|
mdbq/bdup/bdup.py,sha256=LAV0TgnQpc-LB-YuJthxb0U42_VkPidzQzAagan46lU,4234
|
11
11
|
mdbq/clean/__init__.py,sha256=A1d6x3L27j4NtLgiFV5TANwEkLuaDfPHDQNrPBbNWtU,41
|
12
|
-
mdbq/clean/data_clean.py,sha256=
|
12
|
+
mdbq/clean/data_clean.py,sha256=T0WYOKFwNZTNk3temKOw1K2H54kxu9QBJjlTbkMtxNk,94217
|
13
13
|
mdbq/company/__init__.py,sha256=qz8F_GsP_pMB5PblgJAUAMjasuZbOEp3qQOCB39E8f0,21
|
14
14
|
mdbq/company/copysh.py,sha256=WCZ92vCJAy6_ZFeOxWL-U9gArIpyga4xts-s1wKsspY,17268
|
15
15
|
mdbq/config/__init__.py,sha256=jso1oHcy6cJEfa7udS_9uO5X6kZLoPBF8l3wCYmr5dM,18
|
@@ -35,7 +35,7 @@ mdbq/pbix/__init__.py,sha256=Trtfaynu9RjoTyLLYBN2xdRxTvm_zhCniUkVTAYwcjo,24
|
|
35
35
|
mdbq/pbix/pbix_refresh.py,sha256=JUjKW3bNEyoMVfVfo77UhguvS5AWkixvVhDbw4_MHco,2396
|
36
36
|
mdbq/pbix/refresh_all.py,sha256=tgy762608HMaXWynbOURIf2UVMuSPybzrDXQnOOcnZU,6102
|
37
37
|
mdbq/spider/__init__.py,sha256=RBMFXGy_jd1HXZhngB2T2XTvJqki8P_Fr-pBcwijnew,18
|
38
|
-
mdbq-1.7.
|
39
|
-
mdbq-1.7.
|
40
|
-
mdbq-1.7.
|
41
|
-
mdbq-1.7.
|
38
|
+
mdbq-1.7.6.dist-info/METADATA,sha256=QzujGJTSxIt0YV7h24bB6lTwt0Tw7QNStfyJncdGqxY,245
|
39
|
+
mdbq-1.7.6.dist-info/WHEEL,sha256=cpQTJ5IWu9CdaPViMhC9YzF8gZuS5-vlfoFihTBC86A,91
|
40
|
+
mdbq-1.7.6.dist-info/top_level.txt,sha256=2FQ-uLnCSB-OwFiWntzmwosW3X2Xqsg0ewh1axsaylA,5
|
41
|
+
mdbq-1.7.6.dist-info/RECORD,,
|
File without changes
|