mdbq 4.0.43__py3-none-any.whl → 4.0.45__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- mdbq/__version__.py +1 -1
- mdbq/aggregation/query_data.py +9 -7
- {mdbq-4.0.43.dist-info → mdbq-4.0.45.dist-info}/METADATA +1 -1
- {mdbq-4.0.43.dist-info → mdbq-4.0.45.dist-info}/RECORD +6 -6
- {mdbq-4.0.43.dist-info → mdbq-4.0.45.dist-info}/WHEEL +0 -0
- {mdbq-4.0.43.dist-info → mdbq-4.0.45.dist-info}/top_level.txt +0 -0
mdbq/__version__.py
CHANGED
@@ -1 +1 @@
|
|
1
|
-
VERSION = '4.0.43'
|
1
|
+
VERSION = '4.0.45'
|
mdbq/aggregation/query_data.py
CHANGED
@@ -24,7 +24,7 @@ host, port, username, password = parser.get_section_values(
|
|
24
24
|
section='mysql',
|
25
25
|
keys=['host', 'port', 'username', 'password'],
|
26
26
|
)
|
27
|
-
|
27
|
+
host = 'localhost'
|
28
28
|
uld = uploader.MySQLUploader(username=username, password=password, host=host, port=int(port), pool_size=10)
|
29
29
|
|
30
30
|
logger = mylogger.MyLogger(
|
@@ -1514,27 +1514,29 @@ class MysqlDatasQuery:
|
|
1514
1514
|
end_date=end_date,
|
1515
1515
|
projection=projection,
|
1516
1516
|
)
|
1517
|
+
df.pop('data_sku')
|
1517
1518
|
df['日期'] = pd.to_datetime(df['日期'], format='%Y-%m-%d', errors='ignore') # 转换日期列
|
1518
|
-
df = df[df['日期'] == pd.to_datetime('2024-12-12')]
|
1519
|
-
|
1520
1519
|
df_set['商品id'] = df_set['商品id'].astype('int64')
|
1521
1520
|
df['商品id'] = df['商品id'].astype('int64')
|
1522
1521
|
df_set.sort_values('商品id', ascending=False, ignore_index=True, inplace=True)
|
1523
1522
|
|
1523
|
+
# 仅保留最新日期的数据
|
1524
|
+
idx = df.groupby(['商品id'])['更新时间'].idxmax()
|
1525
|
+
df = df.loc[idx]
|
1526
|
+
|
1524
1527
|
def check_year(item_id):
|
1525
1528
|
for item in df_set.to_dict(orient='records'):
|
1526
1529
|
if item_id > item['商品id']:
|
1527
1530
|
return item['上市年份']
|
1528
1531
|
|
1529
1532
|
df['上市年份'] = df['商品id'].apply(lambda x: check_year(x))
|
1530
|
-
p = df.pop('上市年份')
|
1531
|
-
df.insert(loc=5, column='上市年份', value=p)
|
1532
1533
|
set_typ = {
|
1533
1534
|
'日期': 'date',
|
1534
1535
|
'店铺id': 'bigint',
|
1535
1536
|
'店铺名称': 'varchar(255)',
|
1536
1537
|
'商家id': 'bigint',
|
1537
1538
|
'商品id': 'bigint',
|
1539
|
+
'上市年份': 'varchar(50)',
|
1538
1540
|
'商品标题': 'varchar(255)',
|
1539
1541
|
'商品链接': 'varchar(255)',
|
1540
1542
|
'商品图片': 'varchar(255)',
|
@@ -1542,7 +1544,6 @@ class MysqlDatasQuery:
|
|
1542
1544
|
'页面价': 'int',
|
1543
1545
|
'data_sku': 'varchar(1000)',
|
1544
1546
|
'更新时间': 'timestamp',
|
1545
|
-
'上市年份': 'varchar(50)',
|
1546
1547
|
}
|
1547
1548
|
return df, {
|
1548
1549
|
'db_name': db_name,
|
@@ -3742,6 +3743,7 @@ def query3(months=1, download_manager=None):
|
|
3742
3743
|
sdq = MysqlDatasQuery(download_manager=download_manager) # 实例化数据处理类
|
3743
3744
|
sdq.months = months # 设置数据周期, 1 表示近 2 个月
|
3744
3745
|
sdq.spph(db_name='聚合数据', table_name='天猫_商品排行')
|
3746
|
+
sdq.item_up(db_name='聚合数据', table_name='淘宝店铺货品')
|
3745
3747
|
|
3746
3748
|
|
3747
3749
|
def main(months=3):
|
@@ -3779,4 +3781,4 @@ if __name__ == '__main__':
|
|
3779
3781
|
)
|
3780
3782
|
sdq = MysqlDatasQuery(download_manager=download_manager)
|
3781
3783
|
sdq.months = 3
|
3782
|
-
sdq.
|
3784
|
+
sdq.item_up(db_name='聚合数据', table_name='淘宝店铺货品')
|
@@ -1,7 +1,7 @@
|
|
1
1
|
mdbq/__init__.py,sha256=Il5Q9ATdX8yXqVxtP_nYqUhExzxPC_qk_WXQ_4h0exg,16
|
2
|
-
mdbq/__version__.py,sha256=
|
2
|
+
mdbq/__version__.py,sha256=FkR4y0Q2ePf9_DJM8InzWHAQoyH_nonI89ug5PqBPvw,18
|
3
3
|
mdbq/aggregation/__init__.py,sha256=EeDqX2Aml6SPx8363J-v1lz0EcZtgwIBYyCJV6CcEDU,40
|
4
|
-
mdbq/aggregation/query_data.py,sha256=
|
4
|
+
mdbq/aggregation/query_data.py,sha256=V67KBQNNK8Ayhqrgg8GGf8HGW0H8owjbbiwt07b1Qkw,170092
|
5
5
|
mdbq/log/__init__.py,sha256=Mpbrav0s0ifLL7lVDAuePEi1hJKiSHhxcv1byBKDl5E,15
|
6
6
|
mdbq/log/mylogger.py,sha256=kPe3wsQNaB1slfX-Z7VMqzZoMoqPfc7ylYXZDBeFzzI,24945
|
7
7
|
mdbq/myconf/__init__.py,sha256=jso1oHcy6cJEfa7udS_9uO5X6kZLoPBF8l3wCYmr5dM,18
|
@@ -25,7 +25,7 @@ mdbq/redis/__init__.py,sha256=YtgBlVSMDphtpwYX248wGge1x-Ex_mMufz4-8W0XRmA,12
|
|
25
25
|
mdbq/redis/getredis.py,sha256=vpBuNc22uj9Vr-_Dh25_wpwWM1e-072EAAIBdB_IpL0,23494
|
26
26
|
mdbq/spider/__init__.py,sha256=RBMFXGy_jd1HXZhngB2T2XTvJqki8P_Fr-pBcwijnew,18
|
27
27
|
mdbq/spider/aikucun.py,sha256=XptHjGzbout9IYzWAOQUpMMV5qEgLTU8pL1ZGt8oNEA,21868
|
28
|
-
mdbq-4.0.
|
29
|
-
mdbq-4.0.
|
30
|
-
mdbq-4.0.
|
31
|
-
mdbq-4.0.
|
28
|
+
mdbq-4.0.45.dist-info/METADATA,sha256=l9QP6JJAwfO9i4vZpq8H6Z89M6VaOL58wotceJ4MaLY,364
|
29
|
+
mdbq-4.0.45.dist-info/WHEEL,sha256=jB7zZ3N9hIM9adW7qlTAyycLYW9npaWKLRzaoVcLKcM,91
|
30
|
+
mdbq-4.0.45.dist-info/top_level.txt,sha256=2FQ-uLnCSB-OwFiWntzmwosW3X2Xqsg0ewh1axsaylA,5
|
31
|
+
mdbq-4.0.45.dist-info/RECORD,,
|
File without changes
|
File without changes
|