Package Insights
Package Risks
- No releases in 624 days despite active commits
((week_daily_avg - month_daily_avg) / month_daily_avg) * 100
Weekly Downloads
GitHub Stars
Downloads by OS
Python Versions
Top Countries
Dependencies
- backoff
- beautifulsoup4
- chardet
- dataclasses-json
- emoji
- filetype
- langdetect
- lxml
- nltk
- numpy <2
- psutil
- python-iso639
- python-magic
- rapidfuzz
- requests
- tabulate
- tqdm
- typing-extensions
- unstructured-client
- wrapt
151 optional dependencies
- adlfs[azure]
- astrapy[astra]
- atlassian-python-api[confluence]
- atlassian-python-api[jira]
- azure-search-documents[azure-cognitive-search]
- boto3[bedrock]
- boxfs[box]
- bs4[onedrive]
- bs4[biomed]
- bs4[gcs]
- chromadb[chroma]
- clarifai[clarifai]
- confluent-kafka[kafka]
- databricks-sdk[databricks-volumes]
- deltalake[delta-table]
- discord-py[discord]
- dropboxdrivefs[dropbox]
- effdet[image]
- effdet[pdf]
- effdet[all-docs]
- effdet[local-inference]
- elasticsearch[elasticsearch]
- fsspec[sftp]
- fsspec[azure]
- fsspec[box]
- fsspec[delta-table]
- fsspec[dropbox]
- fsspec[gcs]
- fsspec[s3]
- gcsfs[gcs]
- google-api-python-client[google-drive]
- google-cloud-vision[all-docs]
- google-cloud-vision[image]
- google-cloud-vision[local-inference]
- google-cloud-vision[pdf]
- htmlbuilder[notion]
- hubspot-api-client[hubspot]
- importlib-metadata[chroma]
- langchain[embed-voyageai]
- langchain[embed-vertexai]
- langchain-community[embed-vertexai]
- langchain-community[bedrock]
- langchain-google-vertexai[embed-vertexai]
- langchain-huggingface[embed-huggingface]
- langchain-openai[openai]
- langchain-voyageai[embed-voyageai]
- langdetect[huggingface]
- markdown[local-inference]
- markdown[all-docs]
- markdown[md]
- msal[onedrive]
- msal[sharepoint]
- msal[outlook]
- networkx[local-inference]
- networkx[xlsx]
- networkx[all-docs]
- notion-client[notion]
- office365-rest-python-client[outlook]
- office365-rest-python-client[onedrive]
- office365-rest-python-client[sharepoint]
- onnx[local-inference]
- onnx[all-docs]
- onnx[pdf]
- onnx[image]
- openai[embed-octoai]
- openpyxl[all-docs]
- openpyxl[xlsx]
- openpyxl[local-inference]
- opensearch-py[opensearch]
- pandas[xlsx]
- pandas[tsv]
- pandas[csv]
- pandas[all-docs]
- pandas[local-inference]
- paramiko[sftp]
- pdf2image[all-docs]
- pdf2image[image]
- pdf2image[local-inference]
- pdf2image[pdf]
- pdfminer-six[all-docs]
- pdfminer-six[image]
- pdfminer-six[pdf]
- pdfminer-six[local-inference]
- pikepdf[pdf]
- pikepdf[all-docs]
- pikepdf[image]
- pikepdf[local-inference]
- pillow-heif[image]
- pillow-heif[local-inference]
- pillow-heif[pdf]
- pillow-heif[all-docs]
- pinecone-client[pinecone]
- praw[reddit]
- psycopg2-binary[postgres]
- pyairtable[airtable]
- pygithub[github]
- pymongo[mongodb]
- pypandoc[rtf]
- pypandoc[rst]
- pypandoc[org]
- pypandoc[odt]
- pypandoc[local-inference]
- pypandoc[epub]
- pypandoc[all-docs]
- pypdf[all-docs]
- pypdf[local-inference]
- pypdf[image]
- pypdf[pdf]
- pytesseract[local-inference]
- pytesseract[all-docs]
- pytesseract[pdf]
- pytesseract[image]
- python-docx[doc]
- python-docx[docx]
- python-docx[local-inference]
- python-docx[odt]
- python-docx[all-docs]
- python-gitlab[gitlab]
- python-oxmsg[local-inference]
- python-oxmsg[all-docs]
- python-oxmsg[msg]
- python-pptx[local-inference]
- python-pptx[all-docs]
- python-pptx[ppt]
- python-pptx[pptx]
- qdrant-client[qdrant]
- s3fs[s3]
- sacremoses[huggingface]
- sentencepiece[huggingface]
- simple-salesforce[salesforce]
- singlestoredb[singlestore]
- slack-sdk[slack]
- tiktoken[embed-octoai]
- torch[huggingface]
- transformers[huggingface]
- typer[chroma]
- unstructured-inference[pdf]
- unstructured-inference[all-docs]
- unstructured-inference[image]
- unstructured-inference[local-inference]
- unstructured-paddleocr[paddleocr]
- unstructured-pytesseract[image]
- unstructured-pytesseract[local-inference]
- unstructured-pytesseract[pdf]
- unstructured-pytesseract[all-docs]
- urllib3[hubspot]
- weaviate-client[weaviate]
- wikipedia[wikipedia]
- xlrd[all-docs]
- xlrd[local-inference]
- xlrd[xlsx]