Spaces:
Running
Running
[tool.poetry] | |
name = "surya-ocr" | |
version = "0.6.1" | |
description = "OCR, layout, reading order, and table recognition in 90+ languages" | |
authors = ["Vik Paruchuri <[email protected]>"] | |
readme = "README.md" | |
license = "GPL-3.0-or-later" | |
repository = "https://github.com/VikParuchuri/surya" | |
keywords = ["ocr", "pdf", "text detection", "text recognition", "tables"] | |
packages = [ | |
{include = "surya"} | |
] | |
include = [ | |
"detect_text.py", | |
"ocr_text.py", | |
"ocr_app.py", | |
"run_ocr_app.py", | |
"detect_layout.py", | |
"reading_order.py", | |
"table_recognition.py" | |
] | |
[tool.poetry.dependencies] | |
python = ">=3.9,<3.13,!=3.9.7" | |
transformers = "^4.41.0" | |
torch = "^2.3.0" | |
pydantic = "^2.5.3" | |
pydantic-settings = "^2.1.0" | |
python-dotenv = "^1.0.0" | |
pillow = "^10.2.0" | |
pypdfium2 = "^4.25.0" | |
opencv-python = "^4.9.0.80" | |
tabulate = "^0.9.0" | |
filetype = "^1.2.0" | |
ftfy = "^6.1.3" | |
pdftext = "^0.3.12" | |
[tool.poetry.group.dev.dependencies] | |
jupyter = "^1.0.0" | |
pytesseract = "^0.3.10" | |
pymupdf = "^1.23.8" | |
snakeviz = "^2.2.0" | |
datasets = "^2.16.1" | |
rapidfuzz = "^3.6.1" | |
arabic-reshaper = "^3.0.0" | |
streamlit = "^1.31.0" | |
playwright = "^1.41.2" | |
[tool.poetry.scripts] | |
surya_detect = "detect_text:main" | |
surya_ocr = "ocr_text:main" | |
surya_layout = "detect_layout:main" | |
surya_gui = "run_ocr_app:run_app" | |
surya_order = "reading_order:main" | |
surya_table = "table_recognition:main" | |
[build-system] | |
requires = ["poetry-core"] | |
build-backend = "poetry.core.masonry.api" | |