pydoxtools

View on PyPIReverse Dependencies (0)

0.8.0 pydoxtools-0.8.0-py3-none-any.whl

Wheel Details

Project: pydoxtools
Version: 0.8.0
Filename: pydoxtools-0.8.0-py3-none-any.whl
Download: [link]
Size: 155867
MD5: a79e8cd0fe4f3e3e066c5e308d88f88e
SHA256: 91a9a3f9f095d7c2efcd91d8a403acefbd488d6bf17b1f04e79c6aa2bfb56f7c
Uploaded: 2024-01-28 21:47:02 +0000

dist-info

METADATA

Metadata-Version: 2.1
Name: pydoxtools
Version: 0.8.0
Summary: This library contains a set of tools in order to extract and synthesize structured information from documents
Author: thomas meschede
Author-Email: yeusblender[at]gmail.com
Home-Page: https://pydoxtools.xyntopia.com
Project-Url: Documentation, https://pydoxtools.xyntopia.com
Project-Url: Repository, https://github.com/xyntopia/pydoxtools
License: MIT
Keywords: AI,document-analysis,LLM,NLP,ML
Classifier: License :: OSI Approved :: MIT License
Classifier: Programming Language :: Python :: 3
Classifier: Programming Language :: Python :: 3.8
Classifier: Programming Language :: Python :: 3.9
Classifier: Programming Language :: Python :: 3.10
Classifier: Programming Language :: Python :: 3.11
Classifier: Programming Language :: Python :: 3.12
Requires-Python: >=3.8,<4.0
Requires-Dist: Pint (>=0.16.1)
Requires-Dist: Shapely (<2.0.0,>=1.8.0)
Requires-Dist: appdirs (<2.0.0,>=1.4.4)
Requires-Dist: beautifulsoup4 (>=4.8.0); extra == "etl" or extra == "inference"
Requires-Dist: chardet (<6.0.0,>=5.1.0)
Requires-Dist: dask[complete] (<2024.0.0,>=2023.4.1); extra == "etl"
Requires-Dist: diskcache (<6.0.0,>=5.6.1)
Requires-Dist: extruct (>=0.9.0); extra == "etl"
Requires-Dist: fastcoref (<3.0.0,>=2.1.6); extra == "inference"
Requires-Dist: goose3 (<4.0.0,>=3.1.6); extra == "etl"
Requires-Dist: gpt4all (<2.0.0,>=1.0.8); extra == "inference"
Requires-Dist: hnswlib (>=0.6.2); extra == "etl" or extra == "inference"
Requires-Dist: langdetect (<2.0.0,>=1.0.8); extra == "etl"
Requires-Dist: lxml (>=4.6.2)
Requires-Dist: networkx (<3.0.0,>=2.8.6); extra == "etl"
Requires-Dist: openai (<0.28.0,>=0.27.4); extra == "etl"
Requires-Dist: packaging (<24.0,>=23.0)
Requires-Dist: pandas (<3.0.0,>=2.0.1); extra == "etl" or extra == "inference"
Requires-Dist: pandoc (<3.0,>=2.4b0); extra == "etl"
Requires-Dist: pdf2image (<2.0.0,>=1.16.0); extra == "etl"
Requires-Dist: pdfminer.six (>=20200726); extra == "etl"
Requires-Dist: pikepdf (>=2.10.0)
Requires-Dist: pydantic (<3.0.0,>=2.0.0)
Requires-Dist: pydantic-settings (<3.0.0,>=2.1.0)
Requires-Dist: pygraphviz (<2.0,>=1.11); extra == "etl"
Requires-Dist: pytesseract (<0.4.0,>=0.3.10); extra == "etl"
Requires-Dist: python-magic (<0.5.0,>=0.4.27)
Requires-Dist: python-pptx (<0.7.0,>=0.6.21); extra == "etl"
Requires-Dist: pytorch-lightning (>=1.5.6); extra == "inference"
Requires-Dist: pyyaml (<7.0,>=6.0)
Requires-Dist: quantities (>=0.12.4); extra == "etl"
Requires-Dist: quantulum3 (>=0.7.4); extra == "etl"
Requires-Dist: readability-lxml (<0.9.0,>=0.8.1); extra == "etl"
Requires-Dist: scikit-learn (<2.0.0,>=1.0.2); extra == "inference"
Requires-Dist: spacy (<4.0.0,>=3.7.0); extra == "etl" or extra == "inference"
Requires-Dist: stemming (>=1.0.1); extra == "etl"
Requires-Dist: tabulate (<0.10.0,>=0.9.0)
Requires-Dist: timm (<0.10.0,>=0.9.5); extra == "inference"
Requires-Dist: tldextract (>=2.2.3); extra == "etl"
Requires-Dist: torch (!=2.0.1,>=1.12.1); extra == "inference"
Requires-Dist: tqdm (>=4.47.0); extra == "inference"
Requires-Dist: transformers (>=4.17.0); extra == "inference"
Requires-Dist: urlextract (>=1.1.0); extra == "etl" or extra == "inference"
Provides-Extra: etl
Provides-Extra: inference
Description-Content-Type: text/markdown
[Description omitted; length: 11005 characters]

WHEEL

Wheel-Version: 1.0
Generator: poetry-core 1.8.1
Root-Is-Purelib: true
Tag: py3-none-any

RECORD

Path Digest Size
pydoxtools/__init__.py sha256=24-F0RzQhDyA64UtreE162rywO1coUSU2pxubiQwrNU 325
pydoxtools/class_utils.py sha256=qoCS_xn68JB4_QjZmfgsldx5MzWqStquCqUONq7mC_o 2501
pydoxtools/classifier.py sha256=CqnrGnzGinq0ri30MJyzw2GP5soGaWfwIW2OUTWX2x8 30412
pydoxtools/cluster_utils.py sha256=0vwSdJpTB2BMcpMOPki5sxkvwhdg3Qg_CsdXc_5WC88 29768
pydoxtools/dask_operators.py sha256=q0Tkt-dPo_L9iT3WTiNVqEO_BznXQUac4F0fX3S5Stc 6137
pydoxtools/document.py sha256=dQihkDYTEq2Rgi84_5yDiSVUXJvOD_MndX4cruseQhw 69298
pydoxtools/document_base.py sha256=PlsHAMV5Fl_KRu1jlIdRrCO-8Y0vlhg5awHnnRDvFv0 44358
pydoxtools/extract_classes.py sha256=zMmI6P0RK6tjim4OZB4Ut0Si4yDy5_MgmJmK5HuVLE8 3654
pydoxtools/extract_filesystem.py sha256=OrGNJoVZUeLsDleZn8ly5hoJCn9GYEM6ifAk96MDcdY 4065
pydoxtools/extract_html.py sha256=XhGsIBkxkwd8cofb-UX98TclvtnsEJu-k_bvsdSpNAs 13396
pydoxtools/extract_index.py sha256=gteGQQfyZT7tts2xjWTBLem53gxpxu1NIZTlwHMSF_A 7628
pydoxtools/extract_nlpchat.py sha256=5v85AoP6lEfKdnep7YyzvUYcwTUUWuNGlM34PuUFjF0 9815
pydoxtools/extract_objects.py sha256=tNO9BLPR8ay1w_SVFLzqPmHx0OzSfXmO8OyzOxNUUcQ 2561
pydoxtools/extract_ocr.py sha256=fP8t9CWIyS-zxK9PULHJriNknMxZcYMb04yOA_kaowQ 1750
pydoxtools/extract_pandoc.py sha256=OHzLqkIu8akYJu-IB7qOFOBn-ogeKZ0VSKntrF-B8GE 6475
pydoxtools/extract_spacy.py sha256=NkJDT3_BkBihMryNzSoyfYYTlpnMdRUskALr95cYItg 14202
pydoxtools/extract_tables.py sha256=Zmcg7lXxZk4N69FwcqByZrY7zkp783vAjD_cypGsnLA 53832
pydoxtools/extract_textstructure.py sha256=b0vgfbr-ieappCt1zeLPCYUaCtySPZ9N45BGWZvBnvU 18252
pydoxtools/file_utils.py sha256=Oz5YkBldg6rtOFTslSX45ieJYsNi6QTKquh_fj0ReDc 1324
pydoxtools/gui.py sha256=PHEp-01MK8pmgWtc3CG6HN9N5KKzt_BUlXOyvUC9e8E 204
pydoxtools/html_utils.py sha256=DTOCufA6Q6tKs6UnPXU7nkmGO8id_K7-wwpUgzfIQPs 6187
pydoxtools/labeling.py sha256=oXOnzChIRxgmBeJ8xNkEvZ5DLXGlI2m3HdUr3ho04F4 7167
pydoxtools/list_utils.py sha256=ZzBhaAV7OfDwlgOiduf0K3Q9_OJGp8fCPb0fSwHqKNc 7609
pydoxtools/math_utils.py sha256=A6idBVZWOl85vSOi9F2dHKNmecLao-wRHJYnlycbIcA 466
pydoxtools/models.py sha256=vEcTU0NSbQehXvrp_9UGbIL4vyDekKU0pMHzJKsqcRU 2586
pydoxtools/nlp_utils.py sha256=KK3zZbp7A6MLJdqImBmWO3NbpyTuNVXSQ934zPRHDq0 18805
pydoxtools/ocr_language_mappings.py sha256=bOqxCm6AGiT_UxsR73Mqn0eqdFLUpIqbIGKk6BPl9es 2504
pydoxtools/operator_huggingface.py sha256=jDXCUZ-xhyyWmgby1NYr8gG_5jxcQAfAKG5duj38iws 8962
pydoxtools/operators_base.py sha256=BcOAKbIW2rU_nS65e_jZF4d-7XJTt14M2wop_ssHDWM 15041
pydoxtools/pdf_utils.py sha256=vmjLk8XVzgtbzEJ3MC_oVLVBklmxF5FfBv6SI8z8f7E 16719
pydoxtools/random_data_generators.py sha256=Svu41SnN5-3c_9_N7sQrkBWcTwhY5meUcQf6KUSbE7o 34121
pydoxtools/settings.py sha256=oj4nIT6miQZ3smZ_BG4E6fEHbEzUdE_xEQ1miJlqFzo 1425
pydoxtools/training.py sha256=dJzjqMhVabFWfFnd8A0TrChcxNbdmLjTmAxLOOI4NtE 17775
pydoxtools/visual_document_analysis.py sha256=DKYUInMFtrCdiD4zDp7fpnI52Vifv5sVKnA1eBBO_As 5742
pydoxtools/visualization.py sha256=LllhDCCo2d60h9_4OJimMTxG4MFX9-sKuRycvna0N9A 7351
pydoxtools/webdav_utils.py sha256=OMD1O5zAfkfnhvDQMPiPZ51RLBAllETprClhiflhzto 3301
pydoxtools-0.8.0.dist-info/LICENSE sha256=QAhzgyR5OoTzH976zZvlSHrzquahWjYZ0LX2xE_Q3KM 1072
pydoxtools-0.8.0.dist-info/METADATA sha256=cg7T59NAWgkTNlWSJWaG9KpSTiDUItRY9UDSZzIcoqE 14335
pydoxtools-0.8.0.dist-info/WHEEL sha256=FMvqSimYX_P7y0a7UY-_Mc83r5zkBZsCYPm7Lr0Bsq4 88
pydoxtools-0.8.0.dist-info/entry_points.txt sha256=UegCYOipgvGbeQQriEtFxTCOGHb0C3whIH9GgKhgMys 57
pydoxtools-0.8.0.dist-info/RECORD

entry_points.txt

clone-data = clone_data:clone_submodule