Package Insights
((week_daily_avg - month_daily_avg) / month_daily_avg) * 100
Weekly Downloads
GitHub Stars
Downloads by OS
Python Versions
Top Countries
Dependencies
- data-prep-toolkit >=0.2.3.dev0
66 optional dependencies
- colorlog[ray]
- data-prep-connector[web2parquet]
- data-prep-connector[all]
- data-prep-toolkit[doc-chunk]
- data-prep-toolkit[doc-id]
- data-prep-toolkit[doc-quality]
- data-prep-toolkit[ededup]
- data-prep-toolkit[hap]
- data-prep-toolkit[html2parquet]
- data-prep-toolkit[lang-id]
- data-prep-toolkit[ray]
- data-prep-toolkit[text-encoder]
- data-prep-toolkit[tokenization]
- data-prep-toolkit[web2parquet]
- data-prep-toolkit[all]
- deepsearch-glm[all]
- deepsearch-glm[pdf2parquet]
- docling[all]
- docling[pdf2parquet]
- docling-core[all]
- docling-core[doc-chunk]
- docling-core[pdf2parquet]
- docling-ibm-models[all]
- docling-ibm-models[pdf2parquet]
- emerge-viz[ray]
- fasttext[all]
- fasttext[lang-id]
- filetype[all]
- filetype[pdf2parquet]
- func-timeout[ray]
- huggingface-hub[all]
- huggingface-hub[lang-id]
- langcodes[all]
- langcodes[lang-id]
- llama-index-core[all]
- llama-index-core[doc-chunk]
- markupsafe[dev]
- mmh3[all]
- mmh3[ededup]
- moto[dev]
- networkx[ray]
- nltk[all]
- nltk[hap]
- numpy[all]
- numpy[lang-id]
- pandas[all]
- pandas[hap]
- pre-commit[dev]
- pydantic[all]
- pydantic[doc-chunk]
- pytest[dev]
- pytest-cov[dev]
- pytest-dotenv[dev]
- pytest-env[dev]
- pytest-mock[dev]
- sentence-transformers[all]
- sentence-transformers[text-encoder]
- torch[all]
- torch[hap]
- trafilatura[html2parquet]
- transformers[all]
- transformers[hap]
- transformers[tokenization]
- twine[dev]
- xxhash[all]
- xxhash[ededup]