datamarket 0.6.0__py3-none-any.whl → 0.10.3__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of datamarket might be problematic. Click here for more details.
- datamarket/__init__.py +0 -1
- datamarket/exceptions/__init__.py +1 -0
- datamarket/exceptions/main.py +118 -0
- datamarket/interfaces/alchemy.py +1934 -25
- datamarket/interfaces/aws.py +81 -14
- datamarket/interfaces/azure.py +127 -0
- datamarket/interfaces/drive.py +60 -10
- datamarket/interfaces/ftp.py +37 -14
- datamarket/interfaces/llm.py +1220 -0
- datamarket/interfaces/nominatim.py +314 -42
- datamarket/interfaces/peerdb.py +272 -104
- datamarket/interfaces/proxy.py +354 -50
- datamarket/interfaces/tinybird.py +7 -15
- datamarket/params/nominatim.py +439 -0
- datamarket/utils/__init__.py +1 -1
- datamarket/utils/airflow.py +10 -7
- datamarket/utils/alchemy.py +2 -1
- datamarket/utils/logs.py +88 -0
- datamarket/utils/main.py +138 -10
- datamarket/utils/nominatim.py +201 -0
- datamarket/utils/playwright/__init__.py +0 -0
- datamarket/utils/playwright/async_api.py +274 -0
- datamarket/utils/playwright/sync_api.py +281 -0
- datamarket/utils/requests.py +655 -0
- datamarket/utils/selenium.py +6 -12
- datamarket/utils/strings/__init__.py +1 -0
- datamarket/utils/strings/normalization.py +217 -0
- datamarket/utils/strings/obfuscation.py +153 -0
- datamarket/utils/strings/standardization.py +40 -0
- datamarket/utils/typer.py +2 -1
- datamarket/utils/types.py +1 -0
- datamarket-0.10.3.dist-info/METADATA +172 -0
- datamarket-0.10.3.dist-info/RECORD +38 -0
- {datamarket-0.6.0.dist-info → datamarket-0.10.3.dist-info}/WHEEL +1 -2
- datamarket-0.6.0.dist-info/METADATA +0 -49
- datamarket-0.6.0.dist-info/RECORD +0 -24
- datamarket-0.6.0.dist-info/top_level.txt +0 -1
- {datamarket-0.6.0.dist-info → datamarket-0.10.3.dist-info/licenses}/LICENSE +0 -0
|
@@ -1,49 +0,0 @@
|
|
|
1
|
-
Metadata-Version: 2.1
|
|
2
|
-
Name: datamarket
|
|
3
|
-
Version: 0.6.0
|
|
4
|
-
Summary: Utilities that integrate advance scraping knowledge into just one library.
|
|
5
|
-
Home-page: https://github.com/Data-Market/datamarket
|
|
6
|
-
Author: DataMarket
|
|
7
|
-
Author-email: techsupport@datamarket.es
|
|
8
|
-
Project-URL: Website, https://datamarket.es
|
|
9
|
-
Classifier: Programming Language :: Python :: 3
|
|
10
|
-
Classifier: License :: OSI Approved :: GNU General Public License v3 (GPLv3)
|
|
11
|
-
Classifier: Operating System :: OS Independent
|
|
12
|
-
Requires-Python: >=3.7
|
|
13
|
-
Description-Content-Type: text/markdown
|
|
14
|
-
License-File: LICENSE
|
|
15
|
-
Requires-Dist: sqlalchemy
|
|
16
|
-
Requires-Dist: clickhouse-driver
|
|
17
|
-
Requires-Dist: requests[socks]
|
|
18
|
-
Requires-Dist: retry
|
|
19
|
-
Requires-Dist: stem
|
|
20
|
-
Requires-Dist: pydrive2
|
|
21
|
-
Requires-Dist: undetected-chromedriver
|
|
22
|
-
Requires-Dist: pendulum
|
|
23
|
-
Requires-Dist: boto3
|
|
24
|
-
Requires-Dist: inflection
|
|
25
|
-
|
|
26
|
-
# DataMarket scraping core
|
|
27
|
-
|
|
28
|
-
------------------------------------------------------
|
|
29
|
-
[![Code style: black](https://img.shields.io/badge/code%20style-black-000000.svg)](https://github.com/psf/black)
|
|
30
|
-
|
|
31
|
-
|
|
32
|
-
Utilities that integrate advance scraping knowledge into just one library.
|
|
33
|
-
|
|
34
|
-
## Installation
|
|
35
|
-
|
|
36
|
-
To install this library in your Python environment:
|
|
37
|
-
|
|
38
|
-
`pip install datamarket`
|
|
39
|
-
|
|
40
|
-
## Documentation
|
|
41
|
-
|
|
42
|
-
This library has built functionalities for the following topics:
|
|
43
|
-
|
|
44
|
-
- **Databases**: through sqlalchemy it allows to insert records and perform queries in any database.
|
|
45
|
-
- **Proxies**: wide range of functions to perform HTTP requests through custom proxies or the Tor network.
|
|
46
|
-
- **Tinybird**: a Python client for this popular API.
|
|
47
|
-
- **Drive**: functions to upload, delete or authenticate to Google Drive.
|
|
48
|
-
- **FTP**: functions to upload, delete or authenticate to an FTP, SFTP or FTPS server.
|
|
49
|
-
- **Selenium**: wrapper for the main Selenium functions.
|
|
@@ -1,24 +0,0 @@
|
|
|
1
|
-
datamarket/__init__.py,sha256=FHS77P9qNewKMoN-p0FLEUEC60oWIYup1QkbJZP4ays,12
|
|
2
|
-
datamarket/interfaces/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
3
|
-
datamarket/interfaces/alchemy.py,sha256=V8E1GtokxUNmrUftKTFkIpNoXaqJME7ACES2BY0znQM,4214
|
|
4
|
-
datamarket/interfaces/aws.py,sha256=Mk9h-UcdbyNPUaYaG9wlKdd0R95xzTwtX1-_PgsBkjo,2084
|
|
5
|
-
datamarket/interfaces/drive.py,sha256=shbV5jpQVe_KPE-8Idx6Z9te5Zu1SmVfrvSAyd9ZIgE,2915
|
|
6
|
-
datamarket/interfaces/ftp.py,sha256=0Lf59uuGLVpGpnpMxRTnL0a1gPdL3zPMtb8NFyuKK28,1344
|
|
7
|
-
datamarket/interfaces/nominatim.py,sha256=3wbv3Ry2fcG4JNcWwl9FgfTfwHdd8Duwp7UaKK-rRE8,3655
|
|
8
|
-
datamarket/interfaces/peerdb.py,sha256=M2JmSpdJ0EGwow9G9ZHCzVLXOzc1zIgFh50SHrS6sFU,16760
|
|
9
|
-
datamarket/interfaces/proxy.py,sha256=vZ42V4zXBWkW7dTGpDvBMNL45MCHe1ZrYrF8xIY25GU,3367
|
|
10
|
-
datamarket/interfaces/tinybird.py,sha256=o4u-56sft-6Pow-ANkaM-Yga86KJTUgxyVfQJtfZCoY,2565
|
|
11
|
-
datamarket/params/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
12
|
-
datamarket/params/nominatim.py,sha256=pBYRfoBkkLBg2INbFymefmYSzaAVujQSpEro5c1hD_I,1143
|
|
13
|
-
datamarket/utils/__init__.py,sha256=8D5a8oKgqd6WA1RUkiKCn4l_PVemtyuckxQut0vDHXM,20
|
|
14
|
-
datamarket/utils/airflow.py,sha256=al0vc0YUikNu3Oy51VSn52I7pMU40akFBOl_UlHa2E4,795
|
|
15
|
-
datamarket/utils/alchemy.py,sha256=SRq6kgh1aANXVShBPgAuglmNhZssPWwWEY503gKSia8,635
|
|
16
|
-
datamarket/utils/main.py,sha256=HvoAR8JlDthJFINo8XeKhiMJ4zAyoToyBoT9DVmp8O8,2794
|
|
17
|
-
datamarket/utils/selenium.py,sha256=IMKlbLzXABFhACnWzhHmB0l2hhVzNwHGZwbo14nEewQ,2499
|
|
18
|
-
datamarket/utils/soda.py,sha256=eZTXFbI1P3WoMd1MM-YjoVTpdjTcDSWuvBb7ViBMhSQ,941
|
|
19
|
-
datamarket/utils/typer.py,sha256=FDF3l6gh3UlAFPsHCtesnekvct2rKz0oFn3uKARBQvE,814
|
|
20
|
-
datamarket-0.6.0.dist-info/LICENSE,sha256=OXLcl0T2SZ8Pmy2_dmlvKuetivmyPd5m1q-Gyd-zaYY,35149
|
|
21
|
-
datamarket-0.6.0.dist-info/METADATA,sha256=4zA9n3C-32eYrogoxRaKRb8wynSjp2lc5NukVrrwR80,1751
|
|
22
|
-
datamarket-0.6.0.dist-info/WHEEL,sha256=GV9aMThwP_4oNCtvEC2ec3qUYutgWeAzklro_0m4WJQ,91
|
|
23
|
-
datamarket-0.6.0.dist-info/top_level.txt,sha256=GmTOa8ryz1Oq1dUdiHHKhfSIl-_DVYNhZQmXy9xLo70,11
|
|
24
|
-
datamarket-0.6.0.dist-info/RECORD,,
|
|
@@ -1 +0,0 @@
|
|
|
1
|
-
datamarket
|
|
File without changes
|