mdbq 1.4.7__py3-none-any.whl → 1.4.9__py3-none-any.whl

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the contents of those package versions as they appear in their respective public registries.
@@ -1032,12 +1032,12 @@ if __name__ == '__main__':
1032
1032
 
1033
1033
  # test2()
1034
1034
 
1035
- # file = ''
1036
- # df = pd.read_csv(file, encoding='utf-8_sig', header=0, na_filter=False)
1037
- # username, password, host, port = get_myconf.select_config_values(target_service='company', database='mysql')
1038
- # m = mysql.MysqlUpload(username=username, password=password, host=host, port=port)
1039
- # m.df_to_mysql(df=df, db_name='test', table_name='增量更新测试',
1040
- # drop_duplicates=True,
1041
- # # icm_update=['日期', '推广费余额'],
1042
- # system_name='company',
1043
- # )
1035
+ file = ''
1036
+ df = pd.read_csv(file, encoding='utf-8_sig', header=0, na_filter=False)
1037
+ username, password, host, port = get_myconf.select_config_values(target_service='company', database='mysql')
1038
+ m = mysql.MysqlUpload(username=username, password=password, host=host, port=port)
1039
+ m.df_to_mysql(df=df, db_name='市场数据2', table_name='搜索排行',
1040
+ drop_duplicates=True,
1041
+ # icm_update=['日期', '推广费余额'],
1042
+ system_name='company',
1043
+ )
@@ -349,9 +349,60 @@ class GroupBy:
349
349
  }
350
350
  )
351
351
  return df
352
- elif '店铺来源_日数据' in table_name:
352
+ elif '店铺来源_日数据' in table_name and '旧版' not in table_name:
353
+ # 包含三级来源名称和预设索引值列
354
+ # 截取 从上月1日 至 今天的花费数据, 推广款式按此数据从高到低排序(商品图+排序)
355
+ df_visitor3 = df.groupby(['日期', '三级来源'], as_index=False).agg({'访客数': 'sum'})
356
+ df_visitor3 = df_visitor3[~df_visitor3['三级来源'].isin([''])] # 指定列中删除包含空值的行
357
+ # df_visitor = df_visitor[(df_visitor['日期'] >= f'{year_my}-{last_month.month}-01')]
358
+ df_visitor3 = df_visitor3.groupby(['三级来源'], as_index=False).agg({'访客数': 'sum'})
359
+ df_visitor3.sort_values('访客数', ascending=False, ignore_index=True, inplace=True)
360
+ df_visitor3.reset_index(inplace=True)
361
+ df_visitor3['index'] = df_visitor3['index'] + 100
362
+ df_visitor3.rename(columns={'index': '三级访客索引'}, inplace=True)
363
+ df_visitor3 = df_visitor3[['三级来源', '三级访客索引']]
364
+
365
+ # 包含二级来源名称和预设索引值列
366
+ df_visitor2 = df.groupby(['日期', '二级来源'], as_index=False).agg({'访客数': 'sum'})
367
+ df_visitor2 = df_visitor2[~df_visitor2['二级来源'].isin([''])] # 指定列中删除包含空值的行
368
+ # df_visitor2 = df_visitor2[(df_visitor2['日期'] >= f'{year_my}-{last_month.month}-01')]
369
+ df_visitor2 = df_visitor2.groupby(['二级来源'], as_index=False).agg({'访客数': 'sum'})
370
+ df_visitor2.sort_values('访客数', ascending=False, ignore_index=True, inplace=True)
371
+ df_visitor2.reset_index(inplace=True)
372
+ df_visitor2['index'] = df_visitor2['index'] + 100
373
+ df_visitor2.rename(columns={'index': '二级访客索引'}, inplace=True)
374
+ df_visitor2 = df_visitor2[['二级来源', '二级访客索引']]
375
+
376
+ df = pd.merge(df, df_visitor2, how='left', left_on='二级来源', right_on='二级来源')
377
+ df = pd.merge(df, df_visitor3, how='left', left_on='三级来源', right_on='三级来源')
353
378
  return df
354
- elif '店铺来源_日数据_旧版' in table_name:
379
+ elif '天猫_店铺来源_日数据_旧版' in table_name:
380
+
381
+ # 包含三级来源名称和预设索引值列
382
+ # 截取 从上月1日 至 今天的花费数据, 推广款式按此数据从高到低排序(商品图+排序)
383
+ df_visitor3 = df.groupby(['日期', '三级来源'], as_index=False).agg({'访客数': 'sum'})
384
+ df_visitor3 = df_visitor3[~df_visitor3['三级来源'].isin([''])] # 指定列中删除包含空值的行
385
+ # df_visitor = df_visitor[(df_visitor['日期'] >= f'{year_my}-{last_month.month}-01')]
386
+ df_visitor3 = df_visitor3.groupby(['三级来源'], as_index=False).agg({'访客数': 'sum'})
387
+ df_visitor3.sort_values('访客数', ascending=False, ignore_index=True, inplace=True)
388
+ df_visitor3.reset_index(inplace=True)
389
+ df_visitor3['index'] = df_visitor3['index'] + 100
390
+ df_visitor3.rename(columns={'index': '三级访客索引'}, inplace=True)
391
+ df_visitor3 = df_visitor3[['三级来源', '三级访客索引']]
392
+
393
+ # 包含二级来源名称和预设索引值列
394
+ df_visitor2 = df.groupby(['日期', '二级来源'], as_index=False).agg({'访客数': 'sum'})
395
+ df_visitor2 = df_visitor2[~df_visitor2['二级来源'].isin([''])] # 指定列中删除包含空值的行
396
+ # df_visitor2 = df_visitor2[(df_visitor2['日期'] >= f'{year_my}-{last_month.month}-01')]
397
+ df_visitor2 = df_visitor2.groupby(['二级来源'], as_index=False).agg({'访客数': 'sum'})
398
+ df_visitor2.sort_values('访客数', ascending=False, ignore_index=True, inplace=True)
399
+ df_visitor2.reset_index(inplace=True)
400
+ df_visitor2['index'] = df_visitor2['index'] + 100
401
+ df_visitor2.rename(columns={'index': '二级访客索引'}, inplace=True)
402
+ df_visitor2 = df_visitor2[['二级来源', '二级访客索引']]
403
+
404
+ df = pd.merge(df, df_visitor2, how='left', left_on='二级来源', right_on='二级来源')
405
+ df = pd.merge(df, df_visitor3, how='left', left_on='三级来源', right_on='三级来源')
355
406
  return df
356
407
  elif '商品id编码表' in table_name:
357
408
  df['宝贝id'] = df['宝贝id'].astype(str)
@@ -542,6 +593,12 @@ def data_aggregation_one(service_databases=[{}], months=1, system_name=None,):
542
593
  # 从数据库中获取数据, 返回包含 df 数据的字典
543
594
  # 单独处理某一个聚合数据库,在这里修改添加 data_dict 的值
544
595
  data_dict = [
596
+ {
597
+ '数据库名': '聚合数据',
598
+ '集合名': '天猫_店铺来源_日数据_旧版',
599
+ '唯一主键': ['日期', '一级来源', '二级来源', '三级来源'],
600
+ '数据主体': sdq.dplyd_old(),
601
+ },
545
602
  {
546
603
  '数据库名': '聚合数据',
547
604
  '集合名': '天猫_店铺来源_日数据',
@@ -665,5 +722,5 @@ def data_aggregation(service_databases=[{}], months=1, system_name=None,):
665
722
 
666
723
  if __name__ == '__main__':
667
724
  # data_aggregation(service_databases=[{'home_lx': 'mysql'}], months=1, system_name='home_lx')
668
- data_aggregation_one(service_databases=[{'company': 'mysql'}], months=10, system_name='company')
725
+ data_aggregation_one(service_databases=[{'company': 'mysql'}], months=12, system_name='company')
669
726
  # optimize_data.op_data(service_databases=[{'company': 'mysql'}], days=3650) # 立即启动对聚合数据的清理工作
mdbq/config/products.py CHANGED
@@ -17,6 +17,9 @@ class Products:
17
17
 
18
18
  def update_my_datas(self):
19
19
  my_datas = [
20
+ {
21
+ '平台': '天猫', '商品id': '830789689032', '上市年份': '2024年9月'
22
+ },
20
23
  {
21
24
  '平台': '天猫', '商品id': '822020840000', '上市年份': '2024年8月'
22
25
  },
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: mdbq
3
- Version: 1.4.7
3
+ Version: 1.4.9
4
4
  Home-page: https://pypi.org/project/mdbsql
5
5
  Author: xigua,
6
6
  Author-email: 2587125111@qq.com
@@ -1,11 +1,11 @@
1
1
  mdbq/__init__.py,sha256=Il5Q9ATdX8yXqVxtP_nYqUhExzxPC_qk_WXQ_4h0exg,16
2
2
  mdbq/__version__.py,sha256=y9Mp_8x0BCZSHsdLT_q5tX9wZwd5QgqrSIENLrb6vXA,62
3
3
  mdbq/aggregation/__init__.py,sha256=EeDqX2Aml6SPx8363J-v1lz0EcZtgwIBYyCJV6CcEDU,40
4
- mdbq/aggregation/aggregation.py,sha256=uGLS4Zn8oX0TmFxo2G_bDuA7hok4afiZajJZDLxmSNg,59528
4
+ mdbq/aggregation/aggregation.py,sha256=UThzLh2KTL91BpiXxiuy6Z-Nck6v_uqtNnHf3uu-BVs,59513
5
5
  mdbq/aggregation/df_types.py,sha256=oQJS2IBU3_IO6GMgbssHuC2yCjNnbta0QPGrFOwNLnU,7591
6
6
  mdbq/aggregation/mysql_types.py,sha256=3j_SUTi7qYJyY3JtV_lRLIyczIczmRPE_WaIrXiZ6Rw,11425
7
7
  mdbq/aggregation/optimize_data.py,sha256=u2Kl_MFtZueXJ57ycy4H2OhXD431RctUYJYCl637uT0,4176
8
- mdbq/aggregation/query_data.py,sha256=PBBbnwN8fHxd6H_k8gZygu41bFk0H4oL3sKULa9_YSM,31207
8
+ mdbq/aggregation/query_data.py,sha256=JRHChU4u6e64sZCJ8kfVFNq_FAVuz_kFLwkwBehc0Sg,35762
9
9
  mdbq/bdup/__init__.py,sha256=AkhsGk81SkG1c8FqDH5tRq-8MZmFobVbN60DTyukYTY,28
10
10
  mdbq/bdup/bdup.py,sha256=LAV0TgnQpc-LB-YuJthxb0U42_VkPidzQzAagan46lU,4234
11
11
  mdbq/clean/__init__.py,sha256=A1d6x3L27j4NtLgiFV5TANwEkLuaDfPHDQNrPBbNWtU,41
@@ -14,7 +14,7 @@ mdbq/company/__init__.py,sha256=qz8F_GsP_pMB5PblgJAUAMjasuZbOEp3qQOCB39E8f0,21
14
14
  mdbq/company/copysh.py,sha256=RWlQqfpqDiRO1QaVCbPhgAYSopnMoOgcnFhRi0TNFnM,17181
15
15
  mdbq/config/__init__.py,sha256=jso1oHcy6cJEfa7udS_9uO5X6kZLoPBF8l3wCYmr5dM,18
16
16
  mdbq/config/get_myconf.py,sha256=bp6bVARZVm3ANj1pmM9hLB8Ao539TUWeM9xxeSsBpzw,5994
17
- mdbq/config/products.py,sha256=9gqXJMsw8KKuD4Xs6krNgcF7AuWDvV7clI6wVi3QjcA,4260
17
+ mdbq/config/products.py,sha256=xJ5-5y3_yf0bU-w5dCe3X1O3iGjmRTTHAz9PFc_B9pU,4386
18
18
  mdbq/config/set_support.py,sha256=xkZCX6y9Bq1ppBpJAofld4B2YtchA7fl0eT3dx3CrSI,777
19
19
  mdbq/config/update_conf.py,sha256=taL3ZqKgiVWwUrDFuaYhim9a72Hm4BHRhhDscJTziR8,4535
20
20
  mdbq/dataframe/__init__.py,sha256=2HtCN8AdRj53teXDqzysC1h8aPL-mMFy561ESmhehGQ,22
@@ -35,7 +35,7 @@ mdbq/pbix/__init__.py,sha256=Trtfaynu9RjoTyLLYBN2xdRxTvm_zhCniUkVTAYwcjo,24
35
35
  mdbq/pbix/pbix_refresh.py,sha256=JUjKW3bNEyoMVfVfo77UhguvS5AWkixvVhDbw4_MHco,2396
36
36
  mdbq/pbix/refresh_all.py,sha256=tgy762608HMaXWynbOURIf2UVMuSPybzrDXQnOOcnZU,6102
37
37
  mdbq/spider/__init__.py,sha256=RBMFXGy_jd1HXZhngB2T2XTvJqki8P_Fr-pBcwijnew,18
38
- mdbq-1.4.7.dist-info/METADATA,sha256=LtBOaDQcn4v_dj9wjGnSYaoGqXAtzKDdllsXLlCjDFw,245
39
- mdbq-1.4.7.dist-info/WHEEL,sha256=eOLhNAGa2EW3wWl_TU484h7q1UNgy0JXjjoqKoxAAQc,92
40
- mdbq-1.4.7.dist-info/top_level.txt,sha256=2FQ-uLnCSB-OwFiWntzmwosW3X2Xqsg0ewh1axsaylA,5
41
- mdbq-1.4.7.dist-info/RECORD,,
38
+ mdbq-1.4.9.dist-info/METADATA,sha256=dvW4SLr4_CITHSMOzrcQC3aMZNyvgqvqoOvUgIQQmyc,245
39
+ mdbq-1.4.9.dist-info/WHEEL,sha256=eOLhNAGa2EW3wWl_TU484h7q1UNgy0JXjjoqKoxAAQc,92
40
+ mdbq-1.4.9.dist-info/top_level.txt,sha256=2FQ-uLnCSB-OwFiWntzmwosW3X2Xqsg0ewh1axsaylA,5
41
+ mdbq-1.4.9.dist-info/RECORD,,
File without changes