Package Insights
((week_daily_avg - month_daily_avg) / month_daily_avg) * 100
Weekly Downloads
GitHub Stars
Downloads by OS
Python Versions
Top Countries
Dependencies
- dill >=0.3.0
- fsspec >=2023.12.2
- huggingface-hub <1.0,>=0.34.0
- humanize
- loguru >=0.7.0
- multiprocess
- numpy >=2.0.0
- tqdm
57 optional dependencies
- aiofiles[inference]
- aiosqlite[inference]
- bitsandbytes[inference]
- botok[multilingual]
- datasets[io]
- datatrove[testing]
- datatrove[inference]
- datatrove[dev]
- datatrove[all]
- fasteners[processing]
- fasttext-numpy2-wheel[processing]
- faust-cchardet[io]
- flask[testing]
- ftfy[processing]
- httpx[inference]
- indic-nlp-library[multilingual]
- inscriptis[processing]
- jieba[multilingual]
- khmer-nltk[multilingual]
- kiwipiepy[multilingual]
- laonlp[multilingual]
- lighteval[decont]
- moto[testing]
- nltk[processing]
- numpy[inference]
- orjson[io]
- pandas[inference]
- pyahocorasick[processing]
- pyarrow[io]
- pyidaungsu-numpy2[multilingual]
- pytest[testing]
- pytest-rerunfailures[testing]
- pytest-timeout[testing]
- pytest-xdist[testing]
- pythainlp[multilingual]
- python-magic[io]
- pyvi[multilingual]
- pyyaml[inference]
- ray[ray]
- regex[processing]
- rich[cli]
- ruff[quality]
- s3fs[s3]
- sglang[inference]
- spacy[multilingual]
- stanza[multilingual]
- tensorflow[multilingual]
- tldextract[processing]
- tokenizers[processing]
- trafilatura[processing]
- transformers[inference]
- typer[inference]
- urduhack[multilingual]
- vllm[inference]
- warcio[io]
- xxhash[processing]
- zstandard[io]