[project] name = "surya-ocr" version = "0.20.0" description = "OCR, layout, reading order, and table recognition in 90+ languages." readme = "README.md" license = { text = "Apache-2.0" } authors = [ { name = "Vik Paruchuri", email = "vik@datalab.to" }, ] requires-python = ">=3.10,<4" keywords = ["ocr", "pdf", "text detection", "text recognition", "tables"] dependencies = [ "transformers>=4.56.1", "torch>=2.7.0,<3", "pydantic>=2.5.3,<3", "pydantic-settings>=2.1.0,<3", "python-dotenv>=1.0.0,<2", "pillow>=10.2.0,<11", "pypdfium2==4.30.0", "filetype>=1.2.0,<2", "click>=8.1.8,<9", "platformdirs>=4.3.6,<5", "opencv-python-headless==4.11.0.86", "openai>=1.55.0,<2", "httpx>=0.27.0,<0.28", "huggingface-hub>=0.26.0,<1", "filelock>=3.16.0,<4", "beautifulsoup4>=4.12.0,<5", ] [project.urls] Repository = "https://github.com/datalab-to/surya" [project.scripts] surya_detect = "surya.scripts.detect_text:detect_text_cli" surya_ocr = "surya.scripts.ocr_text:ocr_text_cli" surya_layout = "surya.scripts.detect_layout:detect_layout_cli" surya_gui = "surya.scripts.run_streamlit_app:streamlit_app_cli" surya_table = "surya.scripts.table_recognition:table_recognition_cli" surya_screenshot = "surya.scripts.screenshot_app:main" [dependency-groups] dev = [ "pre-commit>=4.2.0", "jupyter>=1.0.0", "pymupdf>=1.23.8", "datasets>=2.16.1", "streamlit>=1.31.0", "pytest>=8.3.4", "pdftext>=0.5.1", "tabulate>=0.9.0", "flask>=3.0.0", ] [build-system] requires = ["hatchling"] build-backend = "hatchling.build" [tool.hatch.build.targets.wheel] packages = ["surya"]