mdbq 4.0.44__py3-none-any.whl → 4.0.45__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- mdbq/__version__.py +1 -1
- mdbq/aggregation/query_data.py +7 -4
- {mdbq-4.0.44.dist-info → mdbq-4.0.45.dist-info}/METADATA +1 -1
- {mdbq-4.0.44.dist-info → mdbq-4.0.45.dist-info}/RECORD +6 -6
- {mdbq-4.0.44.dist-info → mdbq-4.0.45.dist-info}/WHEEL +0 -0
- {mdbq-4.0.44.dist-info → mdbq-4.0.45.dist-info}/top_level.txt +0 -0
mdbq/__version__.py
CHANGED
@@ -1 +1 @@
|
|
1
|
-
VERSION = '4.0.44'
|
1
|
+
VERSION = '4.0.45'
|
mdbq/aggregation/query_data.py
CHANGED
@@ -24,7 +24,7 @@ host, port, username, password = parser.get_section_values(
|
|
24
24
|
section='mysql',
|
25
25
|
keys=['host', 'port', 'username', 'password'],
|
26
26
|
)
|
27
|
-
|
27
|
+
host = 'localhost'
|
28
28
|
uld = uploader.MySQLUploader(username=username, password=password, host=host, port=int(port), pool_size=10)
|
29
29
|
|
30
30
|
logger = mylogger.MyLogger(
|
@@ -1514,25 +1514,29 @@ class MysqlDatasQuery:
|
|
1514
1514
|
end_date=end_date,
|
1515
1515
|
projection=projection,
|
1516
1516
|
)
|
1517
|
+
df.pop('data_sku')
|
1517
1518
|
df['日期'] = pd.to_datetime(df['日期'], format='%Y-%m-%d', errors='ignore') # 转换日期列
|
1518
1519
|
df_set['商品id'] = df_set['商品id'].astype('int64')
|
1519
1520
|
df['商品id'] = df['商品id'].astype('int64')
|
1520
1521
|
df_set.sort_values('商品id', ascending=False, ignore_index=True, inplace=True)
|
1521
1522
|
|
1523
|
+
# 仅保留最新日期的数据
|
1524
|
+
idx = df.groupby(['商品id'])['更新时间'].idxmax()
|
1525
|
+
df = df.loc[idx]
|
1526
|
+
|
1522
1527
|
def check_year(item_id):
|
1523
1528
|
for item in df_set.to_dict(orient='records'):
|
1524
1529
|
if item_id > item['商品id']:
|
1525
1530
|
return item['上市年份']
|
1526
1531
|
|
1527
1532
|
df['上市年份'] = df['商品id'].apply(lambda x: check_year(x))
|
1528
|
-
p = df.pop('上市年份')
|
1529
|
-
df.insert(loc=5, column='上市年份', value=p)
|
1530
1533
|
set_typ = {
|
1531
1534
|
'日期': 'date',
|
1532
1535
|
'店铺id': 'bigint',
|
1533
1536
|
'店铺名称': 'varchar(255)',
|
1534
1537
|
'商家id': 'bigint',
|
1535
1538
|
'商品id': 'bigint',
|
1539
|
+
'上市年份': 'varchar(50)',
|
1536
1540
|
'商品标题': 'varchar(255)',
|
1537
1541
|
'商品链接': 'varchar(255)',
|
1538
1542
|
'商品图片': 'varchar(255)',
|
@@ -1540,7 +1544,6 @@ class MysqlDatasQuery:
|
|
1540
1544
|
'页面价': 'int',
|
1541
1545
|
'data_sku': 'varchar(1000)',
|
1542
1546
|
'更新时间': 'timestamp',
|
1543
|
-
'上市年份': 'varchar(50)',
|
1544
1547
|
}
|
1545
1548
|
return df, {
|
1546
1549
|
'db_name': db_name,
|
@@ -1,7 +1,7 @@
|
|
1
1
|
mdbq/__init__.py,sha256=Il5Q9ATdX8yXqVxtP_nYqUhExzxPC_qk_WXQ_4h0exg,16
|
2
|
-
mdbq/__version__.py,sha256=
|
2
|
+
mdbq/__version__.py,sha256=FkR4y0Q2ePf9_DJM8InzWHAQoyH_nonI89ug5PqBPvw,18
|
3
3
|
mdbq/aggregation/__init__.py,sha256=EeDqX2Aml6SPx8363J-v1lz0EcZtgwIBYyCJV6CcEDU,40
|
4
|
-
mdbq/aggregation/query_data.py,sha256=
|
4
|
+
mdbq/aggregation/query_data.py,sha256=V67KBQNNK8Ayhqrgg8GGf8HGW0H8owjbbiwt07b1Qkw,170092
|
5
5
|
mdbq/log/__init__.py,sha256=Mpbrav0s0ifLL7lVDAuePEi1hJKiSHhxcv1byBKDl5E,15
|
6
6
|
mdbq/log/mylogger.py,sha256=kPe3wsQNaB1slfX-Z7VMqzZoMoqPfc7ylYXZDBeFzzI,24945
|
7
7
|
mdbq/myconf/__init__.py,sha256=jso1oHcy6cJEfa7udS_9uO5X6kZLoPBF8l3wCYmr5dM,18
|
@@ -25,7 +25,7 @@ mdbq/redis/__init__.py,sha256=YtgBlVSMDphtpwYX248wGge1x-Ex_mMufz4-8W0XRmA,12
|
|
25
25
|
mdbq/redis/getredis.py,sha256=vpBuNc22uj9Vr-_Dh25_wpwWM1e-072EAAIBdB_IpL0,23494
|
26
26
|
mdbq/spider/__init__.py,sha256=RBMFXGy_jd1HXZhngB2T2XTvJqki8P_Fr-pBcwijnew,18
|
27
27
|
mdbq/spider/aikucun.py,sha256=XptHjGzbout9IYzWAOQUpMMV5qEgLTU8pL1ZGt8oNEA,21868
|
28
|
-
mdbq-4.0.
|
29
|
-
mdbq-4.0.
|
30
|
-
mdbq-4.0.
|
31
|
-
mdbq-4.0.
|
28
|
+
mdbq-4.0.45.dist-info/METADATA,sha256=l9QP6JJAwfO9i4vZpq8H6Z89M6VaOL58wotceJ4MaLY,364
|
29
|
+
mdbq-4.0.45.dist-info/WHEEL,sha256=jB7zZ3N9hIM9adW7qlTAyycLYW9npaWKLRzaoVcLKcM,91
|
30
|
+
mdbq-4.0.45.dist-info/top_level.txt,sha256=2FQ-uLnCSB-OwFiWntzmwosW3X2Xqsg0ewh1axsaylA,5
|
31
|
+
mdbq-4.0.45.dist-info/RECORD,,
|
File without changes
|
File without changes
|