mdbq 1.6.5__py3-none-any.whl → 1.6.7__py3-none-any.whl
This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
- mdbq/aggregation/query_data.py +6 -1
- mdbq/clean/data_clean.py +2 -2
- {mdbq-1.6.5.dist-info → mdbq-1.6.7.dist-info}/METADATA +1 -1
- {mdbq-1.6.5.dist-info → mdbq-1.6.7.dist-info}/RECORD +6 -6
- {mdbq-1.6.5.dist-info → mdbq-1.6.7.dist-info}/WHEEL +0 -0
- {mdbq-1.6.5.dist-info → mdbq-1.6.7.dist-info}/top_level.txt +0 -0
mdbq/aggregation/query_data.py
CHANGED
@@ -237,7 +237,6 @@ class MysqlDatasQuery:
|
|
237
237
|
columns_name=['日期', '商品id', '商品白底图', '方版场景图'],
|
238
238
|
)
|
239
239
|
df = pd.DataFrame(data=data_values)
|
240
|
-
|
241
240
|
return df
|
242
241
|
|
243
242
|
def dplyd(self):
|
@@ -747,6 +746,8 @@ class GroupBy:
|
|
747
746
|
df = df[['商品id', '商品图片', '日期']]
|
748
747
|
df['商品图片'] = df['商品图片'].apply(lambda x: x if 'http' in x else None) # 检查是否是 http 链接
|
749
748
|
df.dropna(how='all', subset=['商品图片'], axis=0, inplace=True) # 删除指定列含有空值的行
|
749
|
+
df['商品链接'] = df['商品id'].apply(
|
750
|
+
lambda x: f'https://detail.tmall.com/item.htm?id={str(x)}' if x and '.com' not in str(x) else x)
|
750
751
|
df.sort_values(by='商品id', ascending=False, ignore_index=True, inplace=True) # ascending=False 降序排列
|
751
752
|
self.data_tgyj.update(
|
752
753
|
{
|
@@ -1166,6 +1167,10 @@ def data_aggregation(service_databases=[{}], months=1):
|
|
1166
1167
|
# optimize_data.op_data(service_databases=service_databases, days=3650) # 立即启动对聚合数据的清理工作
|
1167
1168
|
|
1168
1169
|
|
1170
|
+
def main():
|
1171
|
+
pass
|
1172
|
+
|
1173
|
+
|
1169
1174
|
if __name__ == '__main__':
|
1170
1175
|
data_aggregation(service_databases=[{'company': 'mysql'}], months=1) # 正常的聚合所有数据
|
1171
1176
|
# data_aggregation_one(service_databases=[{'home_lx': 'mysql'}], months=1) # 单独聚合某一个数据库,具体库进函数编辑
|
mdbq/clean/data_clean.py
CHANGED
@@ -88,7 +88,7 @@ class DataClean:
|
|
88
88
|
continue
|
89
89
|
encoding = self.get_encoding(file_path=pathlib.Path(root, name))
|
90
90
|
# ----------------- 推广报表 分割线 -----------------
|
91
|
-
tg_names = ['
|
91
|
+
tg_names = ['营销场景报表', '计划报表', '单元报表', '关键词报表', '人群报表', '主体报表',
|
92
92
|
'其他主体报表',
|
93
93
|
'创意报表', '地域报表', '权益报表']
|
94
94
|
for tg_name in tg_names:
|
@@ -135,7 +135,7 @@ class DataClean:
|
|
135
135
|
tm_s_name = pattern[0] + shop_name + date_min + date_max
|
136
136
|
new_root_p = pathlib.Path(self.source_path, '推广报表', tg_name) # 文件夹,未包括文件名
|
137
137
|
df['日期'] = pd.to_datetime(df['日期'], format='%Y-%m-%d', errors='ignore')
|
138
|
-
if '省' in df.columns.tolist() and '场景名字' in df.columns.tolist():
|
138
|
+
if '省' in df.columns.tolist() and '场景名字' in df.columns.tolist() and '完整' in name:
|
139
139
|
new_root_p = pathlib.Path(self.source_path, '推广报表', f'完整_{tg_name}')
|
140
140
|
tm_s_name = f'完整_{tm_s_name}'
|
141
141
|
self.save_to_csv(df, new_root_p, tm_s_name)
|
@@ -5,11 +5,11 @@ mdbq/aggregation/aggregation.py,sha256=mPKSiLsJXBPbDYsTso0VmDybinewFRs3z6uiA5Gqs
|
|
5
5
|
mdbq/aggregation/df_types.py,sha256=oQJS2IBU3_IO6GMgbssHuC2yCjNnbta0QPGrFOwNLnU,7591
|
6
6
|
mdbq/aggregation/mysql_types.py,sha256=DQYROALDiwjJzjhaJfIIdnsrNs11i5BORlj_v6bp67Y,11062
|
7
7
|
mdbq/aggregation/optimize_data.py,sha256=u2Kl_MFtZueXJ57ycy4H2OhXD431RctUYJYCl637uT0,4176
|
8
|
-
mdbq/aggregation/query_data.py,sha256=
|
8
|
+
mdbq/aggregation/query_data.py,sha256=EpPkFxeQK4o--GncY3UWiOQHhlfzxHTQ2Q41pDCFwWE,56409
|
9
9
|
mdbq/bdup/__init__.py,sha256=AkhsGk81SkG1c8FqDH5tRq-8MZmFobVbN60DTyukYTY,28
|
10
10
|
mdbq/bdup/bdup.py,sha256=LAV0TgnQpc-LB-YuJthxb0U42_VkPidzQzAagan46lU,4234
|
11
11
|
mdbq/clean/__init__.py,sha256=A1d6x3L27j4NtLgiFV5TANwEkLuaDfPHDQNrPBbNWtU,41
|
12
|
-
mdbq/clean/data_clean.py,sha256=
|
12
|
+
mdbq/clean/data_clean.py,sha256=H2YEYv6sOObJJQ7vTllipYON88DIag23yU76OShMsss,90987
|
13
13
|
mdbq/company/__init__.py,sha256=qz8F_GsP_pMB5PblgJAUAMjasuZbOEp3qQOCB39E8f0,21
|
14
14
|
mdbq/company/copysh.py,sha256=WCZ92vCJAy6_ZFeOxWL-U9gArIpyga4xts-s1wKsspY,17268
|
15
15
|
mdbq/config/__init__.py,sha256=jso1oHcy6cJEfa7udS_9uO5X6kZLoPBF8l3wCYmr5dM,18
|
@@ -35,7 +35,7 @@ mdbq/pbix/__init__.py,sha256=Trtfaynu9RjoTyLLYBN2xdRxTvm_zhCniUkVTAYwcjo,24
|
|
35
35
|
mdbq/pbix/pbix_refresh.py,sha256=JUjKW3bNEyoMVfVfo77UhguvS5AWkixvVhDbw4_MHco,2396
|
36
36
|
mdbq/pbix/refresh_all.py,sha256=tgy762608HMaXWynbOURIf2UVMuSPybzrDXQnOOcnZU,6102
|
37
37
|
mdbq/spider/__init__.py,sha256=RBMFXGy_jd1HXZhngB2T2XTvJqki8P_Fr-pBcwijnew,18
|
38
|
-
mdbq-1.6.
|
39
|
-
mdbq-1.6.
|
40
|
-
mdbq-1.6.
|
41
|
-
mdbq-1.6.
|
38
|
+
mdbq-1.6.7.dist-info/METADATA,sha256=o2jm_V-u-2jgbCRBpTdjUIvfP2LBJi5K8-Twdp_Sf70,245
|
39
|
+
mdbq-1.6.7.dist-info/WHEEL,sha256=eOLhNAGa2EW3wWl_TU484h7q1UNgy0JXjjoqKoxAAQc,92
|
40
|
+
mdbq-1.6.7.dist-info/top_level.txt,sha256=2FQ-uLnCSB-OwFiWntzmwosW3X2Xqsg0ewh1axsaylA,5
|
41
|
+
mdbq-1.6.7.dist-info/RECORD,,
|
File without changes
|
File without changes
|