mdbq 3.2.5__py3-none-any.whl → 3.2.7__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- mdbq/dataframe/converter.py +2 -1
- mdbq/mysql/mysql.py +5 -4
- {mdbq-3.2.5.dist-info → mdbq-3.2.7.dist-info}/METADATA +1 -1
- {mdbq-3.2.5.dist-info → mdbq-3.2.7.dist-info}/RECORD +6 -6
- {mdbq-3.2.5.dist-info → mdbq-3.2.7.dist-info}/WHEEL +1 -1
- {mdbq-3.2.5.dist-info → mdbq-3.2.7.dist-info}/top_level.txt +0 -0
mdbq/dataframe/converter.py
CHANGED
@@ -32,7 +32,8 @@ class DataFrameConverter(object):
|
|
32
32
|
|
33
33
|
# dtypes = df.dtypes.apply(str).to_dict() # 将 dataframe 数据类型转为字典形式
|
34
34
|
df.replace([np.inf, -np.inf], '0', inplace=True) # 清理一些非法值
|
35
|
-
df.replace(to_replace=['\\N', '-', '--', '', 'nan', 'NAN'], value='0', regex=False, inplace=True) # 替换掉特殊字符
|
35
|
+
# df.replace(to_replace=['\\N', '-', '--', '', 'nan', 'NAN'], value='0', regex=False, inplace=True) # 替换掉特殊字符
|
36
|
+
df.replace(to_replace=['\\N', '', 'nan', 'NAN'], value='0', regex=False, inplace=True) # 替换掉特殊字符
|
36
37
|
# df.replace(to_replace=[','], value='', regex=True, inplace=True)
|
37
38
|
df.replace(to_replace=['="'], value='', regex=True, inplace=True) # ="和"不可以放在一起清洗, 因为有: id=86785565
|
38
39
|
df.replace(to_replace=['"'], value='', regex=True, inplace=True)
|
mdbq/mysql/mysql.py
CHANGED
@@ -327,9 +327,9 @@ class MysqlUpload:
|
|
327
327
|
if str(v) == '':
|
328
328
|
v = 0
|
329
329
|
v = str(v)
|
330
|
-
v = re.sub('^-$|^--$|^nan$|^null$', '0', v, re.I)
|
330
|
+
# v = re.sub('^-$|^--$|^nan$|^null$', '0', v, re.I)
|
331
331
|
# v = re.sub(',|="|"', '', v, re.I)
|
332
|
-
v = re.sub('
|
332
|
+
v = re.sub('^="|"$', '', v, re.I)
|
333
333
|
if re.findall(r'^[-+]?\d+\.?\d*%$', v):
|
334
334
|
v = str(float(v.rstrip("%")) / 100)
|
335
335
|
|
@@ -377,8 +377,9 @@ class MysqlUpload:
|
|
377
377
|
def cover_df(self, df):
|
378
378
|
""" 清理 df 的值和列名 """
|
379
379
|
df.replace([np.inf, -np.inf], '0', inplace=True) # 清理一些非法值
|
380
|
-
df.replace(to_replace=['\\N', '-', '--', '', 'nan', 'NAN'], value='0', regex=False, inplace=True) # 替换掉特殊字符
|
381
|
-
df.replace(to_replace=[','], value='', regex=True, inplace=True)
|
380
|
+
# df.replace(to_replace=['\\N', '-', '--', '', 'nan', 'NAN'], value='0', regex=False, inplace=True) # 替换掉特殊字符
|
381
|
+
df.replace(to_replace=['\\N', '', 'nan', 'NAN'], value='0', regex=False, inplace=True) # 替换掉特殊字符
|
382
|
+
# df.replace(to_replace=[','], value='', regex=True, inplace=True)
|
382
383
|
df.replace(to_replace=['="'], value='', regex=True, inplace=True) # ="和"不可以放在一起清洗, 因为有: id=86785565
|
383
384
|
df.replace(to_replace=['"'], value='', regex=True, inplace=True)
|
384
385
|
cols = df.columns.tolist()
|
@@ -22,13 +22,13 @@ mdbq/config/products.py,sha256=Ab6eaAUMUtjRL8z9NvYukyCjp3nAi4OYISY_IdPhAJ0,6279
|
|
22
22
|
mdbq/config/set_support.py,sha256=xkZCX6y9Bq1ppBpJAofld4B2YtchA7fl0eT3dx3CrSI,777
|
23
23
|
mdbq/config/update_conf.py,sha256=taL3ZqKgiVWwUrDFuaYhim9a72Hm4BHRhhDscJTziR8,4535
|
24
24
|
mdbq/dataframe/__init__.py,sha256=2HtCN8AdRj53teXDqzysC1h8aPL-mMFy561ESmhehGQ,22
|
25
|
-
mdbq/dataframe/converter.py,sha256=
|
25
|
+
mdbq/dataframe/converter.py,sha256=lETYhT7KXlWzWwqguqhk6vI6kj4rnOBEW1lhqKy2Abc,5035
|
26
26
|
mdbq/log/__init__.py,sha256=Mpbrav0s0ifLL7lVDAuePEi1hJKiSHhxcv1byBKDl5E,15
|
27
27
|
mdbq/log/mylogger.py,sha256=oaT7Bp-Hb9jZt52seP3ISUuxVcI19s4UiqTeouScBO0,3258
|
28
28
|
mdbq/mongo/__init__.py,sha256=SILt7xMtQIQl_m-ik9WLtJSXIVf424iYgCfE_tnQFbw,13
|
29
29
|
mdbq/mongo/mongo.py,sha256=v9qvrp6p1ZRWuPpbSilqveiE0FEcZF7U5xUPI0RN4xs,31880
|
30
30
|
mdbq/mysql/__init__.py,sha256=A_DPJyAoEvTSFojiI2e94zP0FKtCkkwKP1kYUCSyQzo,11
|
31
|
-
mdbq/mysql/mysql.py,sha256=
|
31
|
+
mdbq/mysql/mysql.py,sha256=shsMl3B9dJqIyztekHt0L01XP7_nLEEY1jsEkCm9FMc,62855
|
32
32
|
mdbq/mysql/recheck_mysql.py,sha256=rgTpvDMWYTyEn7UQdlig-pdXDluTgiU8JG6lkMh8DV0,8665
|
33
33
|
mdbq/mysql/s_query.py,sha256=MbIprZ4yJDAZ9AahZPzl7hqS695Vs0P-AJNwAtA_EEc,9287
|
34
34
|
mdbq/mysql/year_month_day.py,sha256=VgewoE2pJxK7ErjfviL_SMTN77ki8GVbTUcao3vFUCE,1523
|
@@ -46,7 +46,7 @@ mdbq/req_post/__init__.py,sha256=jso1oHcy6cJEfa7udS_9uO5X6kZLoPBF8l3wCYmr5dM,18
|
|
46
46
|
mdbq/req_post/req_tb.py,sha256=qg7pet73IgKGmCwxaeUyImJIoeK_pBQT9BBKD7fkBNg,36160
|
47
47
|
mdbq/spider/__init__.py,sha256=RBMFXGy_jd1HXZhngB2T2XTvJqki8P_Fr-pBcwijnew,18
|
48
48
|
mdbq/spider/aikucun.py,sha256=48isoL6nEi_uniV-ja2HwYAI7O8D1i1goO4SzBwDGSU,19036
|
49
|
-
mdbq-3.2.
|
50
|
-
mdbq-3.2.
|
51
|
-
mdbq-3.2.
|
52
|
-
mdbq-3.2.
|
49
|
+
mdbq-3.2.7.dist-info/METADATA,sha256=_PvMX_qrt7C5VTFsKDLiS169BwcfwP3-MZgBQEp9SA0,243
|
50
|
+
mdbq-3.2.7.dist-info/WHEEL,sha256=eOLhNAGa2EW3wWl_TU484h7q1UNgy0JXjjoqKoxAAQc,92
|
51
|
+
mdbq-3.2.7.dist-info/top_level.txt,sha256=2FQ-uLnCSB-OwFiWntzmwosW3X2Xqsg0ewh1axsaylA,5
|
52
|
+
mdbq-3.2.7.dist-info/RECORD,,
|
File without changes
|