unstructured-ingest 0.0.18__py3-none-any.whl → 0.0.21__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of unstructured-ingest might be problematic. Click here for more details.

Files changed (27) hide show
  1. unstructured_ingest/__version__.py +1 -1
  2. unstructured_ingest/cli/cmds/astradb.py +2 -2
  3. unstructured_ingest/connector/astradb.py +54 -24
  4. unstructured_ingest/v2/processes/chunker.py +8 -29
  5. unstructured_ingest/v2/processes/connectors/astradb.py +26 -19
  6. unstructured_ingest/v2/processes/connectors/chroma.py +2 -5
  7. unstructured_ingest/v2/processes/connectors/databricks_volumes.py +12 -14
  8. unstructured_ingest/v2/processes/connectors/fsspec/azure.py +1 -6
  9. unstructured_ingest/v2/processes/connectors/fsspec/box.py +1 -6
  10. unstructured_ingest/v2/processes/connectors/fsspec/dropbox.py +2 -5
  11. unstructured_ingest/v2/processes/connectors/fsspec/gcs.py +1 -6
  12. unstructured_ingest/v2/processes/connectors/fsspec/s3.py +1 -6
  13. unstructured_ingest/v2/processes/connectors/kdbai.py +2 -5
  14. unstructured_ingest/v2/processes/connectors/local.py +2 -5
  15. unstructured_ingest/v2/processes/connectors/milvus.py +2 -5
  16. unstructured_ingest/v2/processes/connectors/mongodb.py +2 -5
  17. unstructured_ingest/v2/processes/connectors/pinecone.py +2 -5
  18. unstructured_ingest/v2/processes/connectors/sql.py +1 -6
  19. unstructured_ingest/v2/processes/connectors/weaviate.py +2 -5
  20. unstructured_ingest/v2/processes/partitioner.py +9 -55
  21. unstructured_ingest/v2/unstructured_api.py +87 -0
  22. {unstructured_ingest-0.0.18.dist-info → unstructured_ingest-0.0.21.dist-info}/METADATA +369 -369
  23. {unstructured_ingest-0.0.18.dist-info → unstructured_ingest-0.0.21.dist-info}/RECORD +27 -26
  24. {unstructured_ingest-0.0.18.dist-info → unstructured_ingest-0.0.21.dist-info}/LICENSE.md +0 -0
  25. {unstructured_ingest-0.0.18.dist-info → unstructured_ingest-0.0.21.dist-info}/WHEEL +0 -0
  26. {unstructured_ingest-0.0.18.dist-info → unstructured_ingest-0.0.21.dist-info}/entry_points.txt +0 -0
  27. {unstructured_ingest-0.0.18.dist-info → unstructured_ingest-0.0.21.dist-info}/top_level.txt +0 -0
@@ -1,5 +1,5 @@
1
1
  unstructured_ingest/__init__.py,sha256=U4S_2y3zgLZVfMenHRaJFBW8yqh2mUBuI291LGQVOJ8,35
2
- unstructured_ingest/__version__.py,sha256=bJ5C3mWqhuWY5BAH5bAUzjjkW54gcd2KffrdBiGTVK0,43
2
+ unstructured_ingest/__version__.py,sha256=jKsHPdCiaS4Mdql3-_XwS3BGWgrosIEEQ7-K8uTyviU,43
3
3
  unstructured_ingest/error.py,sha256=qDncnJgbf5ils956RcO2CGlAKYDT5OaEM9Clv1JVTNc,1448
4
4
  unstructured_ingest/interfaces.py,sha256=LuY-85clq5iyOtDd9vDABjK2MZCm6wRWK53cdb4SROY,31411
5
5
  unstructured_ingest/logger.py,sha256=S5nSqGcABoQyeicgRnBQFjDScCaTvFVivOCvbo-laL0,4479
@@ -17,7 +17,7 @@ unstructured_ingest/cli/base/dest.py,sha256=uN44l7kPErm_BQqKFUgaiz_Xu6UKk-mnB1B8
17
17
  unstructured_ingest/cli/base/src.py,sha256=gDLZlBuOCEGMAAFCLkoURFQKmrmE34WQ5DbT0w1ssy4,2179
18
18
  unstructured_ingest/cli/cmds/__init__.py,sha256=TtVhAdlPv7e1DKYZ_D2q0wauE-1IjF-AtHp0RIskoD8,5932
19
19
  unstructured_ingest/cli/cmds/airtable.py,sha256=SgdUztUCFbabWP3K937TwdYlhrdY2PUtE4TXUHfBGtw,2629
20
- unstructured_ingest/cli/cmds/astradb.py,sha256=T5Ccz29BDNewuHlL1PN5MDnBggQ93o2lGZgxDgTNtys,2931
20
+ unstructured_ingest/cli/cmds/astradb.py,sha256=2subkQvVHOxSs98Zu3bPKtIUl-uzjNEMarcYQaPYCh0,2929
21
21
  unstructured_ingest/cli/cmds/azure_cognitive_search.py,sha256=PcM55PtpRMHbP69trW0JCTz-gx6tKMLUaMU4GGXv0g8,1927
22
22
  unstructured_ingest/cli/cmds/biomed.py,sha256=M2jc7_-EvbAeDtDwtZNrPI48QJ1Tm401LcSUD0Ayd20,1442
23
23
  unstructured_ingest/cli/cmds/chroma.py,sha256=zO17L7LgUaDfKutfQjSE-QjZJcREyeSpWZetja243lE,3267
@@ -59,7 +59,7 @@ unstructured_ingest/cli/cmds/fsspec/s3.py,sha256=v-24oFxhabdShryK2dhP4cDBvVyoQ-8
59
59
  unstructured_ingest/cli/cmds/fsspec/sftp.py,sha256=TCB7sf_GYoifryQbbttknYSt9Q1kRCPtu8B8QgXl3lw,1537
60
60
  unstructured_ingest/connector/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
61
61
  unstructured_ingest/connector/airtable.py,sha256=KcLt-FEabO9D5ev5E4xUf06VYHpYpypP-adTVyhGcb8,10585
62
- unstructured_ingest/connector/astradb.py,sha256=kDDcITwmUqgZ2y0cYMxMIsEr3c7s8SXrRI1LplTRlos,8635
62
+ unstructured_ingest/connector/astradb.py,sha256=jU2rS5Xips6eNNrHvNIxIYD-2u7wwPzW08aMc5NKZOE,9814
63
63
  unstructured_ingest/connector/azure_cognitive_search.py,sha256=cqQdAaEzt4coU7sxnl4GY8Em4a6azFLyAKM6enkmjBA,5850
64
64
  unstructured_ingest/connector/biomed.py,sha256=uwtBuKzpHfxbJckHAHcsnKo4dTCdag66tCDtCqKNSZM,10847
65
65
  unstructured_ingest/connector/chroma.py,sha256=Nma6HebQxNY7CCWwWArkX3kMXf2xVv6L-jrfRjMi9LE,5713
@@ -265,6 +265,7 @@ unstructured_ingest/v2/__init__.py,sha256=U4S_2y3zgLZVfMenHRaJFBW8yqh2mUBuI291LG
265
265
  unstructured_ingest/v2/logger.py,sha256=wcln4s5Nyp2fjjJux9iM3d6t9aQFNJ2H1IAZXmIknjI,4323
266
266
  unstructured_ingest/v2/main.py,sha256=WFdLEqEXRy6E9_G-dF20MK2AtgX51Aan1sp_N67U2B8,172
267
267
  unstructured_ingest/v2/otel.py,sha256=2fGj1c7cVcC3J8NwL6MNYhyPEAXiB33DsilvRDkrdLo,4130
268
+ unstructured_ingest/v2/unstructured_api.py,sha256=1EQVuL-TojmFxWoWFzXr1oCFPEC3IkCQqhjXM8spdTY,3373
268
269
  unstructured_ingest/v2/utils.py,sha256=9LnhpI8Otpq5HPcN2Dtkp7APD_euq1ylKhIsybuK99Y,1714
269
270
  unstructured_ingest/v2/cli/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
270
271
  unstructured_ingest/v2/cli/cli.py,sha256=qHXIs-PcvMgDZhP1AR9iDMxh8FXBMJCEDksPBfiMULE,648
@@ -301,46 +302,46 @@ unstructured_ingest/v2/pipeline/steps/stage.py,sha256=ZvP-Rz_A5UkhZNoRUvVgciJbGX
301
302
  unstructured_ingest/v2/pipeline/steps/uncompress.py,sha256=pEu7VU27Fuu53eqBddAmXihV74A6JTwTfnjKeb__edY,1745
302
303
  unstructured_ingest/v2/pipeline/steps/upload.py,sha256=G9z8QQe9b_WokI5qyr4UOOqaepEVgwFqMn9pWcta9gI,1917
303
304
  unstructured_ingest/v2/processes/__init__.py,sha256=FaHWSCGyc7GWVnAsNEUUj7L8hT8gCVY3_hUE2VzWtUg,462
304
- unstructured_ingest/v2/processes/chunker.py,sha256=W2qPIddT-QEhHTKpA1krUhBrR0UFOq4nuko2eBjlG_I,6675
305
+ unstructured_ingest/v2/processes/chunker.py,sha256=76PrpCSd8k3DpfdZcl8I10u7vciKzhSV9ZByrrp302g,5476
305
306
  unstructured_ingest/v2/processes/connector_registry.py,sha256=vkEe6jpgdYtZCxMj59s5atWGgmPuxAEXRUoTt-MJ7wc,2198
306
307
  unstructured_ingest/v2/processes/embedder.py,sha256=ZBCIm0oHxWmtUEQYyAjXACqTYPt3LnvXLtoFhu6mu8A,6077
307
308
  unstructured_ingest/v2/processes/filter.py,sha256=kjUmMw2SDq2bme0JCAOxs6cJriIG6Ty09KOznS-xz08,2145
308
- unstructured_ingest/v2/processes/partitioner.py,sha256=KyWCo7qOQb1wyU8GJ2krejWSNE1vWRHvhEl1V_oDEU8,10040
309
+ unstructured_ingest/v2/processes/partitioner.py,sha256=bpqmZDsKKi6qtxNWdIWBfQmr1ccQUhU0axecpGAUf_4,7739
309
310
  unstructured_ingest/v2/processes/uncompress.py,sha256=Z_XfsITGdyaRwhtNUc7bMj5Y2jLuBge8KoK4nxhqKag,2425
310
311
  unstructured_ingest/v2/processes/connectors/__init__.py,sha256=6iBdoH6BW8oMK1ZvEi0IgEchuk0cNUPoNIaikpzeML8,4992
311
312
  unstructured_ingest/v2/processes/connectors/airtable.py,sha256=LLz3qVhbcZrHXeK1xu8lywj828wsDwYDfSsaNB2CwrA,8915
312
- unstructured_ingest/v2/processes/connectors/astradb.py,sha256=bjlzJVNANnpTxRm8Ba8ZS0KetJ_yxmEyEoPJDwUkcOw,5774
313
+ unstructured_ingest/v2/processes/connectors/astradb.py,sha256=ZctZRfXcOAMBGPkKgHvhTmV_-2F0YN5vqwfY9UCHIlU,5791
313
314
  unstructured_ingest/v2/processes/connectors/azure_cognitive_search.py,sha256=S55v7TXu30rEdgythMBB_2VcuomyMPmcPtLYykbhw_E,8466
314
- unstructured_ingest/v2/processes/connectors/chroma.py,sha256=HRIHZSflSIRpVlLhXl_RLrmskESbAYait3TDBLS1fgU,8099
315
+ unstructured_ingest/v2/processes/connectors/chroma.py,sha256=skrxRPHZ8y3JxNa0dt5SVitHiDQ5WVxLvY_kh2-QUrQ,8029
315
316
  unstructured_ingest/v2/processes/connectors/couchbase.py,sha256=SONLywyEfoAlLc-HPabXeGzoiwKnekMHIbRMXd4CGXs,12146
316
- unstructured_ingest/v2/processes/connectors/databricks_volumes.py,sha256=K0Sjt57vsVxL2eImqHzu7LnAONPUVTcDw2-hdLcWjV0,5984
317
+ unstructured_ingest/v2/processes/connectors/databricks_volumes.py,sha256=c5rVY2vrqJw3vINExMhFoANnjBCVnYil0Jm97u_WJ7g,6024
317
318
  unstructured_ingest/v2/processes/connectors/elasticsearch.py,sha256=H8svPr-Yk3UniHT1O9kUd2QhTfrJdzbqRNLFZIMiITQ,16750
318
319
  unstructured_ingest/v2/processes/connectors/google_drive.py,sha256=7xOQthcqBd9auJxB0nxZlhh1vdjXpMX_CtQZa6YfZz0,13088
319
- unstructured_ingest/v2/processes/connectors/kdbai.py,sha256=vF-Owg2ZDI4nC7sk-Ied-5o_qkfwJzDr3uztOeS8kC0,5653
320
- unstructured_ingest/v2/processes/connectors/local.py,sha256=PdXWzkiXHqCaQq7M06LmcCabg0mRPmaIOET7LA5BwLc,6806
321
- unstructured_ingest/v2/processes/connectors/milvus.py,sha256=uF93R9V_tkCQ9XRUEiwMTYdR3vgH9dH9SWJgkaY6Nbw,7761
322
- unstructured_ingest/v2/processes/connectors/mongodb.py,sha256=q_GRuG2RQ5-8ajefifKuhFO52wCVhtU9j4ZIEf5hNas,4948
320
+ unstructured_ingest/v2/processes/connectors/kdbai.py,sha256=D71gt8fsPOXi2-Rir8mATw6dRM3BdzYGnn62qG1iaBw,5586
321
+ unstructured_ingest/v2/processes/connectors/local.py,sha256=a3stgnIkhBbXPIQD0O-RaRM-Eb-szHj9Yy4Fz881-9c,6723
322
+ unstructured_ingest/v2/processes/connectors/milvus.py,sha256=oJCsCHgbMSKZ8AphU_vO_R_4OmGv9Nm7gFdNDUmcu7E,7675
323
+ unstructured_ingest/v2/processes/connectors/mongodb.py,sha256=2_R_hrEAaTU4vJTCK9oKblWTgv6BKjyUhFtC7uq3q2w,4859
323
324
  unstructured_ingest/v2/processes/connectors/onedrive.py,sha256=ZiUo-dFo1LMOvFwphSLRZiR1PcrN8GWLTHhsh4TU6n0,9207
324
325
  unstructured_ingest/v2/processes/connectors/opensearch.py,sha256=PNkJGLCCkwxLvxKX6vF_0jy-LC4wKu8PCXzmULEo9sk,6755
325
- unstructured_ingest/v2/processes/connectors/pinecone.py,sha256=slIvM5i7_u-LDlNJF-i9oV_1EcKFKuoTaGDRyhZ4p20,6840
326
+ unstructured_ingest/v2/processes/connectors/pinecone.py,sha256=gCueI1Px7UkI1flNovLMRvcbPGczHI3IlYhOPYlb3WU,6748
326
327
  unstructured_ingest/v2/processes/connectors/salesforce.py,sha256=2CiO2ZZiZ1Y1-nB7wcDlDVcpW2B7ut9wCj66rkkqho0,11616
327
328
  unstructured_ingest/v2/processes/connectors/sharepoint.py,sha256=hOaV5gBcHFc6N5Rbu3MgM-5Aol1ht-QkNIN4PqjvfxE,19665
328
329
  unstructured_ingest/v2/processes/connectors/singlestore.py,sha256=4rVvWKK2iQr03Ff6cB5zjfE1MpN0JyIGpCxxFCDI6hc,5563
329
- unstructured_ingest/v2/processes/connectors/sql.py,sha256=tDWL3YqL8MQuLsjW8A-KUkpSLh1iOn934OWfzPkqils,9298
330
+ unstructured_ingest/v2/processes/connectors/sql.py,sha256=srj2ECKnkGR_iEFBdpa8sxw3ACCvJ5L0uoKCuHxKUe4,9204
330
331
  unstructured_ingest/v2/processes/connectors/utils.py,sha256=8kd0g7lo9NqnpaIkjeO-Ut6erhwUNH_gS9koevpe3WE,878
331
- unstructured_ingest/v2/processes/connectors/weaviate.py,sha256=4hBQ9GWbBv6ti9futVJCShNugDC6Vh7Hy9ZhEC4XDpM,8958
332
+ unstructured_ingest/v2/processes/connectors/weaviate.py,sha256=Ss0YyD5T6k-00eJ6dr5lSo2H0LcOjVTMmozehyTvnAo,8866
332
333
  unstructured_ingest/v2/processes/connectors/fsspec/__init__.py,sha256=TtdeImM7Ypl_n6sl7I1JqX6bGSG0t_FqvCqE3Cy24og,1846
333
- unstructured_ingest/v2/processes/connectors/fsspec/azure.py,sha256=GrC44PnA8PLHUJQ4aH3gETxL8v8UvknbKptxiXweqdc,6214
334
- unstructured_ingest/v2/processes/connectors/fsspec/box.py,sha256=JgSgF7f4UOx_JUV8zghgykyBA4rKvqkErRm6zYXO1XA,4434
335
- unstructured_ingest/v2/processes/connectors/fsspec/dropbox.py,sha256=ZnoSGAZ4wtOhyg8G3PLYFMpbMVsBffvW-qp5jWwEDuA,4775
334
+ unstructured_ingest/v2/processes/connectors/fsspec/azure.py,sha256=dzOuy1RuozGnCCFJ6CiE3brijcv5WHBnUVVJXx75bks,6057
335
+ unstructured_ingest/v2/processes/connectors/fsspec/box.py,sha256=_yOII2D1zCnI-ae_G7Fx7lb5GuTiaELIHtIyfeDOKGE,4343
336
+ unstructured_ingest/v2/processes/connectors/fsspec/dropbox.py,sha256=pjDsOVf-a3ERBL3PVop7fI8wIrJc4-51CHzolivLwY8,4686
336
337
  unstructured_ingest/v2/processes/connectors/fsspec/fsspec.py,sha256=Ri1TscAbQyIb3QZXDIC3vYJyGRgFWAOrzaQsngsCl-Q,12785
337
- unstructured_ingest/v2/processes/connectors/fsspec/gcs.py,sha256=O1j0hIYWI4lPpTQ5hsEKV8usDCrUm-t1qVcSNKsJQd0,6006
338
- unstructured_ingest/v2/processes/connectors/fsspec/s3.py,sha256=cOMvMh0C9rtyEPJ0X59Fn-qb11LFUMRfeUgsi3QRWUk,6390
338
+ unstructured_ingest/v2/processes/connectors/fsspec/gcs.py,sha256=eKcFYwnUNr3TwEGyriV9lvXRo9AZEOw_dvVyibVD0dM,5915
339
+ unstructured_ingest/v2/processes/connectors/fsspec/s3.py,sha256=UfI4MxUd74K0i1odJx9KZOfJtvwixL6n2DWvhLOgkfo,6302
339
340
  unstructured_ingest/v2/processes/connectors/fsspec/sftp.py,sha256=NkcU4U2DQWWuM8UHkez67C3SEOZpVyRtmtNS-z-F0Fw,6056
340
341
  unstructured_ingest/v2/processes/connectors/fsspec/utils.py,sha256=jec_Qfe2hbfahBuY-u8FnvHuv933AI5HwPFjOL3kEEY,456
341
- unstructured_ingest-0.0.18.dist-info/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
342
- unstructured_ingest-0.0.18.dist-info/METADATA,sha256=rKqUHDyuaADzZishCNkNG8JlnkxswaTljDIBPzAs7_Q,28507
343
- unstructured_ingest-0.0.18.dist-info/WHEEL,sha256=eOLhNAGa2EW3wWl_TU484h7q1UNgy0JXjjoqKoxAAQc,92
344
- unstructured_ingest-0.0.18.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
345
- unstructured_ingest-0.0.18.dist-info/top_level.txt,sha256=QaTxTcjfM5Hr9sZJ6weOJvSe5ESQc0F8AWkhHInTCf8,20
346
- unstructured_ingest-0.0.18.dist-info/RECORD,,
342
+ unstructured_ingest-0.0.21.dist-info/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
343
+ unstructured_ingest-0.0.21.dist-info/METADATA,sha256=0LbQTW5dTus7hdY_JkPxbeOitzVoAgzQy0ikdF48Sc0,28507
344
+ unstructured_ingest-0.0.21.dist-info/WHEEL,sha256=eOLhNAGa2EW3wWl_TU484h7q1UNgy0JXjjoqKoxAAQc,92
345
+ unstructured_ingest-0.0.21.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
346
+ unstructured_ingest-0.0.21.dist-info/top_level.txt,sha256=QaTxTcjfM5Hr9sZJ6weOJvSe5ESQc0F8AWkhHInTCf8,20
347
+ unstructured_ingest-0.0.21.dist-info/RECORD,,