mdbq 4.0.44__py3-none-any.whl → 4.0.45__py3-none-any.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
mdbq/__version__.py CHANGED
@@ -1 +1 @@
1
- VERSION = '4.0.44'
1
+ VERSION = '4.0.45'
@@ -24,7 +24,7 @@ host, port, username, password = parser.get_section_values(
24
24
  section='mysql',
25
25
  keys=['host', 'port', 'username', 'password'],
26
26
  )
27
- # host = 'localhost'
27
+ host = 'localhost'
28
28
  uld = uploader.MySQLUploader(username=username, password=password, host=host, port=int(port), pool_size=10)
29
29
 
30
30
  logger = mylogger.MyLogger(
@@ -1514,25 +1514,29 @@ class MysqlDatasQuery:
1514
1514
  end_date=end_date,
1515
1515
  projection=projection,
1516
1516
  )
1517
+ df.pop('data_sku')
1517
1518
  df['日期'] = pd.to_datetime(df['日期'], format='%Y-%m-%d', errors='ignore') # 转换日期列
1518
1519
  df_set['商品id'] = df_set['商品id'].astype('int64')
1519
1520
  df['商品id'] = df['商品id'].astype('int64')
1520
1521
  df_set.sort_values('商品id', ascending=False, ignore_index=True, inplace=True)
1521
1522
 
1523
+ # 仅保留最新日期的数据
1524
+ idx = df.groupby(['商品id'])['更新时间'].idxmax()
1525
+ df = df.loc[idx]
1526
+
1522
1527
  def check_year(item_id):
1523
1528
  for item in df_set.to_dict(orient='records'):
1524
1529
  if item_id > item['商品id']:
1525
1530
  return item['上市年份']
1526
1531
 
1527
1532
  df['上市年份'] = df['商品id'].apply(lambda x: check_year(x))
1528
- p = df.pop('上市年份')
1529
- df.insert(loc=5, column='上市年份', value=p)
1530
1533
  set_typ = {
1531
1534
  '日期': 'date',
1532
1535
  '店铺id': 'bigint',
1533
1536
  '店铺名称': 'varchar(255)',
1534
1537
  '商家id': 'bigint',
1535
1538
  '商品id': 'bigint',
1539
+ '上市年份': 'varchar(50)',
1536
1540
  '商品标题': 'varchar(255)',
1537
1541
  '商品链接': 'varchar(255)',
1538
1542
  '商品图片': 'varchar(255)',
@@ -1540,7 +1544,6 @@ class MysqlDatasQuery:
1540
1544
  '页面价': 'int',
1541
1545
  'data_sku': 'varchar(1000)',
1542
1546
  '更新时间': 'timestamp',
1543
- '上市年份': 'varchar(50)',
1544
1547
  }
1545
1548
  return df, {
1546
1549
  'db_name': db_name,
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.2
2
2
  Name: mdbq
3
- Version: 4.0.44
3
+ Version: 4.0.45
4
4
  Home-page: https://pypi.org/project/mdbq
5
5
  Author: xigua,
6
6
  Author-email: 2587125111@qq.com
@@ -1,7 +1,7 @@
1
1
  mdbq/__init__.py,sha256=Il5Q9ATdX8yXqVxtP_nYqUhExzxPC_qk_WXQ_4h0exg,16
2
- mdbq/__version__.py,sha256=Yq_JgKwKONwVexEyE66trDbripXgbesAkvt1eQ___20,18
2
+ mdbq/__version__.py,sha256=FkR4y0Q2ePf9_DJM8InzWHAQoyH_nonI89ug5PqBPvw,18
3
3
  mdbq/aggregation/__init__.py,sha256=EeDqX2Aml6SPx8363J-v1lz0EcZtgwIBYyCJV6CcEDU,40
4
- mdbq/aggregation/query_data.py,sha256=ZWLJghNiEtyA4rvgUqMCLorY0R4-Likd6i4mVMuOni0,170025
4
+ mdbq/aggregation/query_data.py,sha256=V67KBQNNK8Ayhqrgg8GGf8HGW0H8owjbbiwt07b1Qkw,170092
5
5
  mdbq/log/__init__.py,sha256=Mpbrav0s0ifLL7lVDAuePEi1hJKiSHhxcv1byBKDl5E,15
6
6
  mdbq/log/mylogger.py,sha256=kPe3wsQNaB1slfX-Z7VMqzZoMoqPfc7ylYXZDBeFzzI,24945
7
7
  mdbq/myconf/__init__.py,sha256=jso1oHcy6cJEfa7udS_9uO5X6kZLoPBF8l3wCYmr5dM,18
@@ -25,7 +25,7 @@ mdbq/redis/__init__.py,sha256=YtgBlVSMDphtpwYX248wGge1x-Ex_mMufz4-8W0XRmA,12
25
25
  mdbq/redis/getredis.py,sha256=vpBuNc22uj9Vr-_Dh25_wpwWM1e-072EAAIBdB_IpL0,23494
26
26
  mdbq/spider/__init__.py,sha256=RBMFXGy_jd1HXZhngB2T2XTvJqki8P_Fr-pBcwijnew,18
27
27
  mdbq/spider/aikucun.py,sha256=XptHjGzbout9IYzWAOQUpMMV5qEgLTU8pL1ZGt8oNEA,21868
28
- mdbq-4.0.44.dist-info/METADATA,sha256=6BCrO5mef08KVeODcA3rgk-gOsNtI_8_CTh0mghCKeE,364
29
- mdbq-4.0.44.dist-info/WHEEL,sha256=jB7zZ3N9hIM9adW7qlTAyycLYW9npaWKLRzaoVcLKcM,91
30
- mdbq-4.0.44.dist-info/top_level.txt,sha256=2FQ-uLnCSB-OwFiWntzmwosW3X2Xqsg0ewh1axsaylA,5
31
- mdbq-4.0.44.dist-info/RECORD,,
28
+ mdbq-4.0.45.dist-info/METADATA,sha256=l9QP6JJAwfO9i4vZpq8H6Z89M6VaOL58wotceJ4MaLY,364
29
+ mdbq-4.0.45.dist-info/WHEEL,sha256=jB7zZ3N9hIM9adW7qlTAyycLYW9npaWKLRzaoVcLKcM,91
30
+ mdbq-4.0.45.dist-info/top_level.txt,sha256=2FQ-uLnCSB-OwFiWntzmwosW3X2Xqsg0ewh1axsaylA,5
31
+ mdbq-4.0.45.dist-info/RECORD,,
File without changes