mdbq 4.0.30__py3-none-any.whl → 4.0.32__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- mdbq/__version__.py +1 -1
- mdbq/aggregation/query_data.py +12 -34
- mdbq/myconf/myconf.py +28 -0
- mdbq/mysql/deduplicator.py +5 -16
- mdbq/mysql/s_query.py +3 -3
- mdbq/mysql/unique_.py +2 -2
- mdbq/mysql/uploader.py +8 -0
- mdbq/other/download_sku_picture.py +55 -33
- {mdbq-4.0.30.dist-info → mdbq-4.0.32.dist-info}/METADATA +1 -1
- {mdbq-4.0.30.dist-info → mdbq-4.0.32.dist-info}/RECORD +12 -13
- mdbq/myconf/myconf_bak.py +0 -816
- {mdbq-4.0.30.dist-info → mdbq-4.0.32.dist-info}/WHEEL +0 -0
- {mdbq-4.0.30.dist-info → mdbq-4.0.32.dist-info}/top_level.txt +0 -0
@@ -18,7 +18,7 @@ from selenium.webdriver.common.by import By
|
|
18
18
|
from selenium.webdriver.support import expected_conditions as EC
|
19
19
|
from selenium.webdriver.chrome.service import Service
|
20
20
|
from mdbq.myconf import myconf
|
21
|
-
from mdbq.mysql import mysql
|
21
|
+
from mdbq.mysql import uploader
|
22
22
|
from mdbq.mysql import s_query
|
23
23
|
from mdbq.other import ua_sj
|
24
24
|
import requests
|
@@ -54,7 +54,6 @@ host, port, username, password = parser.get_section_values(
|
|
54
54
|
section='mysql',
|
55
55
|
keys=['host', 'port', 'username', 'password'],
|
56
56
|
)
|
57
|
-
m_engine = mysql.MysqlUpload(username=username, password=password, host=host, port=int(port), charset='utf8mb4')
|
58
57
|
|
59
58
|
if not username:
|
60
59
|
print(f'找不到主机:')
|
@@ -816,17 +815,24 @@ def main(service_name, database):
|
|
816
815
|
s.each_page() # 根据 urls 获取每个商品数据并更新为 df
|
817
816
|
tb_driver2.quit()
|
818
817
|
|
819
|
-
|
820
|
-
|
821
|
-
|
822
|
-
|
823
|
-
|
824
|
-
|
825
|
-
|
826
|
-
|
827
|
-
|
828
|
-
|
829
|
-
|
818
|
+
with uploader.MySQLUploader(username=username, password=password, host=host, port=int(port), pool_size=2) as uld:
|
819
|
+
upload_result = uld.upload_data(
|
820
|
+
db_name='属性设置2',
|
821
|
+
table_name='天猫商品sku信息',
|
822
|
+
data=s.df,
|
823
|
+
set_typ={}, # 定义列和数据类型
|
824
|
+
primary_keys=[], # 创建唯一主键
|
825
|
+
check_duplicate=False, # 检查重复数据
|
826
|
+
update_on_duplicate=False, # 遇到重复时更新数据,默认 False 跳过
|
827
|
+
duplicate_columns=[], # 指定排重的组合键
|
828
|
+
allow_null=False, # 允许插入空值
|
829
|
+
partition_by=None, # 按年/月分表
|
830
|
+
partition_date_column='日期', # 用于分表的日期列名,默认为'日期'
|
831
|
+
auto_create=True, # 表不存在时自动创建, 默认参数不要更改
|
832
|
+
indexes=[], # 指定索引列
|
833
|
+
transaction_mode='row', # 事务模式
|
834
|
+
unique_keys=[[]], # 唯一约束列表
|
835
|
+
)
|
830
836
|
|
831
837
|
|
832
838
|
def main2(service_name, database):
|
@@ -896,16 +902,24 @@ def download_sku(service_name='company', database='mysql', db_name='属性设置
|
|
896
902
|
tb_driver2.quit()
|
897
903
|
|
898
904
|
# 回传数据库
|
899
|
-
|
900
|
-
|
901
|
-
|
902
|
-
|
903
|
-
|
904
|
-
|
905
|
-
|
906
|
-
|
907
|
-
|
908
|
-
|
905
|
+
with uploader.MySQLUploader(username=username, password=password, host=host, port=int(port), pool_size=2) as uld:
|
906
|
+
upload_result = uld.upload_data(
|
907
|
+
db_name=table_name,
|
908
|
+
table_name=table_name,
|
909
|
+
data=s.df,
|
910
|
+
set_typ={}, # 定义列和数据类型
|
911
|
+
primary_keys=[], # 创建唯一主键
|
912
|
+
check_duplicate=False, # 检查重复数据
|
913
|
+
update_on_duplicate=False, # 遇到重复时更新数据,默认 False 跳过
|
914
|
+
duplicate_columns=[], # 指定排重的组合键
|
915
|
+
allow_null=False, # 允许插入空值
|
916
|
+
partition_by=None, # 按年/月分表
|
917
|
+
partition_date_column='日期', # 用于分表的日期列名,默认为'日期'
|
918
|
+
auto_create=True, # 表不存在时自动创建, 默认参数不要更改
|
919
|
+
indexes=[], # 指定索引列
|
920
|
+
transaction_mode='row', # 事务模式
|
921
|
+
unique_keys=[[]], # 唯一约束列表
|
922
|
+
)
|
909
923
|
|
910
924
|
# 从数据库中读取数据,并下载素材到本地
|
911
925
|
|
@@ -935,16 +949,24 @@ def download_sku(service_name='company', database='mysql', db_name='属性设置
|
|
935
949
|
df['获取与下载'] = df.apply(lambda x: '已下载' if x['sku编码'] in d.finish_download else x['获取与下载'], axis=1)
|
936
950
|
|
937
951
|
# 回传数据库
|
938
|
-
|
939
|
-
|
940
|
-
|
941
|
-
|
942
|
-
|
943
|
-
|
944
|
-
|
945
|
-
|
946
|
-
|
947
|
-
|
952
|
+
with uploader.MySQLUploader(username=username, password=password, host=host, port=int(port), pool_size=2) as uld:
|
953
|
+
upload_result = uld.upload_data(
|
954
|
+
db_name=db_name,
|
955
|
+
table_name=table_name,
|
956
|
+
data=df,
|
957
|
+
set_typ={}, # 定义列和数据类型
|
958
|
+
primary_keys=[], # 创建唯一主键
|
959
|
+
check_duplicate=False, # 检查重复数据
|
960
|
+
update_on_duplicate=False, # 遇到重复时更新数据,默认 False 跳过
|
961
|
+
duplicate_columns=[], # 指定排重的组合键
|
962
|
+
allow_null=False, # 允许插入空值
|
963
|
+
partition_by=None, # 按年/月分表
|
964
|
+
partition_date_column='日期', # 用于分表的日期列名,默认为'日期'
|
965
|
+
auto_create=True, # 表不存在时自动创建, 默认参数不要更改
|
966
|
+
indexes=[], # 指定索引列
|
967
|
+
transaction_mode='row', # 事务模式
|
968
|
+
unique_keys=[[]], # 唯一约束列表
|
969
|
+
)
|
948
970
|
|
949
971
|
|
950
972
|
def download_spu(username, password, host, port, heads=0, col_name='白底图', save_path=os.path.join(upload_path, '商品id_商家编码_图片'), ):
|
@@ -1,20 +1,19 @@
|
|
1
1
|
mdbq/__init__.py,sha256=Il5Q9ATdX8yXqVxtP_nYqUhExzxPC_qk_WXQ_4h0exg,16
|
2
|
-
mdbq/__version__.py,sha256=
|
2
|
+
mdbq/__version__.py,sha256=JlP9c4CD0Z8Ewghucau-8dDN36XOz-Fzk6Lsmjua5AY,18
|
3
3
|
mdbq/aggregation/__init__.py,sha256=EeDqX2Aml6SPx8363J-v1lz0EcZtgwIBYyCJV6CcEDU,40
|
4
|
-
mdbq/aggregation/query_data.py,sha256=
|
4
|
+
mdbq/aggregation/query_data.py,sha256=JrIoYIQpwFETAZ_KG7RKSO4aoLcegHwKT8kiktChOdk,164705
|
5
5
|
mdbq/log/__init__.py,sha256=Mpbrav0s0ifLL7lVDAuePEi1hJKiSHhxcv1byBKDl5E,15
|
6
6
|
mdbq/log/mylogger.py,sha256=9w_o5mYB3FooIxobq_lSa6oCYTKIhPxDFox-jeLtUHI,21714
|
7
7
|
mdbq/myconf/__init__.py,sha256=jso1oHcy6cJEfa7udS_9uO5X6kZLoPBF8l3wCYmr5dM,18
|
8
|
-
mdbq/myconf/myconf.py,sha256=
|
9
|
-
mdbq/myconf/myconf_bak.py,sha256=39tLUBVlWQZzQfrwk7YoLEfipo11fpwWjaLBHcUt2qM,33341
|
8
|
+
mdbq/myconf/myconf.py,sha256=rHvQCnQRKhQ49AZBke-Z4v28hyOLmHt4MylIuB0H6yA,33516
|
10
9
|
mdbq/mysql/__init__.py,sha256=A_DPJyAoEvTSFojiI2e94zP0FKtCkkwKP1kYUCSyQzo,11
|
11
|
-
mdbq/mysql/deduplicator.py,sha256=
|
10
|
+
mdbq/mysql/deduplicator.py,sha256=YgOUkjLEm8DmH_p-du-MTnR3gTFztjUoaY3b-QklnR4,73077
|
12
11
|
mdbq/mysql/mysql.py,sha256=pDg771xBugCMSTWeskIFTi3pFLgaqgyG3smzf-86Wn8,56772
|
13
|
-
mdbq/mysql/s_query.py,sha256=
|
14
|
-
mdbq/mysql/unique_.py,sha256=
|
15
|
-
mdbq/mysql/uploader.py,sha256=
|
12
|
+
mdbq/mysql/s_query.py,sha256=hQpoZ868hxDQpZ-im5Kmmixdh0Khkzj-MrVxkUTU3Kg,44984
|
13
|
+
mdbq/mysql/unique_.py,sha256=MaztT-WIyEQUs-OOYY4pFulgHVcXR1BfCy3QUz0XM_U,21127
|
14
|
+
mdbq/mysql/uploader.py,sha256=_c_8t5Cx2qbtyOLtii2Gv7vpTlpawWjrB_9zBz1MaC4,81507
|
16
15
|
mdbq/other/__init__.py,sha256=jso1oHcy6cJEfa7udS_9uO5X6kZLoPBF8l3wCYmr5dM,18
|
17
|
-
mdbq/other/download_sku_picture.py,sha256=
|
16
|
+
mdbq/other/download_sku_picture.py,sha256=X66sVdvVgzoNzmgVJyPtd7bjEvctEKtLPblEPF65EWc,46940
|
18
17
|
mdbq/other/otk.py,sha256=iclBIFbQbhlqzUbcMMoePXBpcP1eZ06ZtjnhcA_EbmE,7241
|
19
18
|
mdbq/other/pov_city.py,sha256=AEOmCOzOwyjHi9LLZWPKi6DUuSC-_M163664I52u9qw,21050
|
20
19
|
mdbq/other/ua_sj.py,sha256=JuVYzc_5QZ9s_oQSrTHVKkQv4S_7-CWx4oIKOARn_9U,22178
|
@@ -25,7 +24,7 @@ mdbq/redis/__init__.py,sha256=YtgBlVSMDphtpwYX248wGge1x-Ex_mMufz4-8W0XRmA,12
|
|
25
24
|
mdbq/redis/getredis.py,sha256=vpBuNc22uj9Vr-_Dh25_wpwWM1e-072EAAIBdB_IpL0,23494
|
26
25
|
mdbq/spider/__init__.py,sha256=RBMFXGy_jd1HXZhngB2T2XTvJqki8P_Fr-pBcwijnew,18
|
27
26
|
mdbq/spider/aikucun.py,sha256=XptHjGzbout9IYzWAOQUpMMV5qEgLTU8pL1ZGt8oNEA,21868
|
28
|
-
mdbq-4.0.
|
29
|
-
mdbq-4.0.
|
30
|
-
mdbq-4.0.
|
31
|
-
mdbq-4.0.
|
27
|
+
mdbq-4.0.32.dist-info/METADATA,sha256=PILyHn6uBC6wAxIFcw6M_xwrLb8t4n3Htvbj33vGjsI,364
|
28
|
+
mdbq-4.0.32.dist-info/WHEEL,sha256=jB7zZ3N9hIM9adW7qlTAyycLYW9npaWKLRzaoVcLKcM,91
|
29
|
+
mdbq-4.0.32.dist-info/top_level.txt,sha256=2FQ-uLnCSB-OwFiWntzmwosW3X2Xqsg0ewh1axsaylA,5
|
30
|
+
mdbq-4.0.32.dist-info/RECORD,,
|