Package Insights
((week_daily_avg - month_daily_avg) / month_daily_avg) * 100
Weekly Downloads
GitHub Stars
Downloads by OS
Python Versions
Top Countries
Dependencies
- beautifulsoup4 <5.0.0,>=4.14.3
- charset-normalizer <4.0.0,>=3.4.4
- emoji <3.0.0,>=2.15.0
- filelock <4.0.0,>=3.12.0
- filetype <2.0.0,>=1.2.0
- html5lib <2.0.0,>=1.1
- installer <1.0.0,>=0.7.0
- langdetect <2.0.0,>=1.0.9
- lxml <7.0.0,>=5.0.0
- numba <1.0.0,>=0.60.0
- numpy <3.0.0,>=1.26.0
- psutil <8.0.0,>=7.2.2
- python-iso639 <2027.0.0,>=2026.1.31
- python-magic <1.0.0,>=0.4.27
- python-oxmsg <1.0.0,>=0.0.2
- rapidfuzz <4.0.0,>=3.14.3
- regex <2027.0.0,>=2024.0.0
- requests <3.0.0,>=2.32.5
- spacy <4.0.0,>=3.7.0
- tqdm <5.0.0,>=4.67.3
- typing-extensions <5.0.0,>=4.15.0
- unstructured-client <1.0.0,>=0.25.9
- wrapt <3.0.0,>=2.1.1
78 optional dependencies
- google-cloud-vision[local-inference]
- google-cloud-vision[all-docs]
- google-cloud-vision[image]
- google-cloud-vision[pdf]
- markdown[all-docs]
- markdown[local-inference]
- markdown[md]
- msoffcrypto-tool[all-docs]
- msoffcrypto-tool[xlsx]
- msoffcrypto-tool[local-inference]
- networkx[xlsx]
- networkx[all-docs]
- networkx[local-inference]
- openai-whisper[all-docs]
- openai-whisper[local-inference]
- openai-whisper[audio]
- openpyxl[all-docs]
- openpyxl[local-inference]
- openpyxl[xlsx]
- paddlepaddle[paddleocr]
- pandas[xlsx]
- pandas[all-docs]
- pandas[csv]
- pandas[local-inference]
- pandas[tsv]
- pdf2image[local-inference]
- pdf2image[pdf]
- pdf2image[image]
- pdf2image[all-docs]
- pdfminer-six[image]
- pdfminer-six[all-docs]
- pdfminer-six[pdf]
- pdfminer-six[local-inference]
- pi-heif[local-inference]
- pi-heif[pdf]
- pi-heif[all-docs]
- pi-heif[image]
- pikepdf[local-inference]
- pikepdf[all-docs]
- pikepdf[image]
- pikepdf[pdf]
- pypandoc-binary[epub]
- pypandoc-binary[rtf]
- pypandoc-binary[rst]
- pypandoc-binary[org]
- pypandoc-binary[odt]
- pypandoc-binary[all-docs]
- pypandoc-binary[local-inference]
- pypdf[image]
- pypdf[all-docs]
- pypdf[pdf]
- pypdf[local-inference]
- python-docx[doc]
- python-docx[odt]
- python-docx[all-docs]
- python-docx[local-inference]
- python-docx[docx]
- python-pptx[ppt]
- python-pptx[local-inference]
- python-pptx[pptx]
- python-pptx[all-docs]
- sentencepiece[huggingface]
- tiktoken[chunking-tokens]
- torch[huggingface]
- transformers[huggingface]
- unstructured-inference[local-inference]
- unstructured-inference[pdf]
- unstructured-inference[all-docs]
- unstructured-inference[image]
- unstructured-ingest[ingest]
- unstructured-paddleocr[paddleocr]
- unstructured-pytesseract[image]
- unstructured-pytesseract[all-docs]
- unstructured-pytesseract[local-inference]
- unstructured-pytesseract[pdf]
- xlrd[all-docs]
- xlrd[local-inference]
- xlrd[xlsx]