Package Insights
((week_daily_avg - month_daily_avg) / month_daily_avg) * 100
Weekly Downloads
GitHub Stars
Downloads by OS
Python Versions
Top Countries
Dependencies
- beautifulsoup4 >=4.14.3
- deep-translator >=1.11.4
- gdown >=5.2.1
- lingua-language-detector >=2.2.0
- mineru >=2.7.6
- networkx >=3.6
- numpy >=2.4.2
- opencv-python >=4.13.0.92
- pandas >=2.3.3
- pillow >=11.3.0
- playwright ==1.58.0
- requests >=2.32.5
- torch >=2.10.0
- torchvision ==0.26.0
- transformers >=4.57.6
161 optional dependencies
- accelerate[dev]
- aiofiles[dev]
- aiohappyeyeballs[dev]
- aiohttp[dev]
- aiosignal[dev]
- albucore[dev]
- albumentations[dev]
- annotated-doc[dev]
- annotated-types[dev]
- antlr4-python3-runtime[dev]
- anyio[dev]
- attrs[dev]
- av[dev]
- beautifulsoup4[dev]
- boto3[dev]
- botocore[dev]
- brotli[dev]
- certifi[dev]
- cffi[dev]
- charset-normalizer[dev]
- click[dev]
- colorlog[dev]
- contourpy[dev]
- cryptography[dev]
- cycler[dev]
- datasets[dev]
- deep-translator[dev]
- dill[dev]
- distro[dev]
- doclayout-yolo[dev]
- einops[dev]
- fastapi[dev]
- fast-langdetect[dev]
- fasttext-predict[dev]
- ffmpy[dev]
- filelock[dev]
- flatbuffers[dev]
- fonttools[dev]
- frozenlist[dev]
- fsspec[dev]
- ftfy[dev]
- gdown[dev]
- gradio[dev]
- gradio-client[dev]
- gradio-pdf[dev]
- groovy[dev]
- h11[dev]
- hf-xet[dev]
- httpcore[dev]
- httpx[dev]
- httpx-retries[dev]
- huggingface-hub[dev]
- idna[dev]
- imageio[dev]
- jinja2[dev]
- jiter[dev]
- jmespath[dev]
- json-repair[dev]
- kiwisolver[dev]
- lazy-loader[dev]
- lingua-language-detector[dev]
- loguru[dev]
- magika[dev]
- markdown-it-py[dev]
- markupsafe[dev]
- matplotlib[dev]
- mdurl[dev]
- mineru[dev]
- mineru-vl-utils[dev]
- mlx[dev]
- mlx-lm[dev]
- mlx-metal[dev]
- mlx-vlm[dev]
- modelscope[dev]
- mpmath[dev]
- multidict[dev]
- multiprocess[dev]
- networkx[dev]
- numpy[dev]
- omegaconf[dev]
- onnxruntime[dev]
- openai[dev]
- opencv-python[dev]
- opencv-python-headless[dev]
- orjson[dev]
- packaging[dev]
- pandas[dev]
- pdfminer-six[dev]
- pdftext[dev]
- pillow[dev]
- polars[dev]
- polars-runtime-32[dev]
- propcache[dev]
- protobuf[dev]
- psutil[dev]
- pyarrow[dev]
- pyclipper[dev]
- pycparser[dev]
- py-cpuinfo[dev]
- pydantic[dev]
- pydantic-core[dev]
- pydantic-settings[dev]
- pydub[dev]
- pygments[dev]
- pyparsing[dev]
- pypdf[dev]
- pypdfium2[dev]
- pysocks[dev]
- python-dateutil[dev]
- python-dotenv[dev]
- python-multipart[dev]
- pytz[dev]
- pyyaml[dev]
- qwen-vl-utils[dev]
- regex[dev]
- reportlab[dev]
- requests[dev]
- rich[dev]
- robust-downloader[dev]
- ruff[dev]
- s3transfer[dev]
- safehttpx[dev]
- safetensors[dev]
- scikit-image[dev]
- scipy[dev]
- seaborn[dev]
- semantic-version[dev]
- sentencepiece[dev]
- setuptools[dev]
- shapely[dev]
- shellingham[dev]
- simsimd[dev]
- six[dev]
- sniffio[dev]
- soundfile[dev]
- soupsieve[dev]
- starlette[dev]
- stringzilla[dev]
- sympy[dev]
- thop[dev]
- tifffile[dev]
- timm[dev]
- tokenizers[dev]
- tomlkit[dev]
- torch[dev]
- tqdm[dev]
- transformers[dev]
- typer[dev]
- typing-extensions[dev]
- typing-inspection[dev]
- tzdata[dev]
- ultralytics[dev]
- ultralytics-thop[dev]
- urllib3[dev]
- uv[dev]
- uvicorn[dev]
- wcwidth[dev]
- websockets[dev]
- wheel[dev]
- xxhash[dev]
- yarl[dev]