Vik Paruchuri
committed on
Commit
·
7a9ab8a
1
Parent(s):
c9f5e37
Fix issue with config passing
Browse files
- marker/config/printer.py +1 -5
- marker/logger.py +4 -2
- marker/settings.py +4 -1
- poetry.lock +140 -102
- pyproject.toml +2 -2
- tests/config/test_config.py +11 -1
marker/config/printer.py
CHANGED
|
@@ -6,8 +6,6 @@ from marker.config.crawler import crawler
|
|
| 6 |
|
| 7 |
|
| 8 |
class CustomClickPrinter(click.Command):
|
| 9 |
-
force_flags = ["use_llm"]
|
| 10 |
-
|
| 11 |
def parse_args(self, ctx, args):
|
| 12 |
display_help = "config" in args and "--help" in args
|
| 13 |
if display_help:
|
|
@@ -49,9 +47,6 @@ class CustomClickPrinter(click.Command):
|
|
| 49 |
# Add shared attribute options first
|
| 50 |
for attr, info in shared_attrs.items():
|
| 51 |
if info["type"] in attr_types:
|
| 52 |
-
if attr in self.force_flags:
|
| 53 |
-
continue
|
| 54 |
-
|
| 55 |
ctx.command.params.append(
|
| 56 |
click.Option(
|
| 57 |
["--" + attr],
|
|
@@ -60,6 +55,7 @@ class CustomClickPrinter(click.Command):
|
|
| 60 |
+ f" (Applies to: {', '.join(info['classes'])})",
|
| 61 |
default=None, # This is important, or it sets all the default keys again in config
|
| 62 |
is_flag=info["is_flag"],
|
|
|
|
| 63 |
)
|
| 64 |
)
|
| 65 |
|
|
|
|
| 6 |
|
| 7 |
|
| 8 |
class CustomClickPrinter(click.Command):
|
|
|
|
|
|
|
| 9 |
def parse_args(self, ctx, args):
|
| 10 |
display_help = "config" in args and "--help" in args
|
| 11 |
if display_help:
|
|
|
|
| 47 |
# Add shared attribute options first
|
| 48 |
for attr, info in shared_attrs.items():
|
| 49 |
if info["type"] in attr_types:
|
|
|
|
|
|
|
|
|
|
| 50 |
ctx.command.params.append(
|
| 51 |
click.Option(
|
| 52 |
["--" + attr],
|
|
|
|
| 55 |
+ f" (Applies to: {', '.join(info['classes'])})",
|
| 56 |
default=None, # This is important, or it sets all the default keys again in config
|
| 57 |
is_flag=info["is_flag"],
|
| 58 |
+
flag_value=True if info["is_flag"] else None,
|
| 59 |
)
|
| 60 |
)
|
| 61 |
|
marker/logger.py
CHANGED
|
@@ -1,10 +1,12 @@
|
|
| 1 |
import logging
|
| 2 |
import warnings
|
| 3 |
|
|
|
|
|
|
|
| 4 |
|
| 5 |
def configure_logging():
|
| 6 |
# Setup marker logger
|
| 7 |
-
logger =
|
| 8 |
|
| 9 |
if not logger.handlers:
|
| 10 |
handler = logging.StreamHandler()
|
|
@@ -14,7 +16,7 @@ def configure_logging():
|
|
| 14 |
handler.setFormatter(formatter)
|
| 15 |
logger.addHandler(handler)
|
| 16 |
|
| 17 |
-
logger.setLevel(
|
| 18 |
|
| 19 |
# Ignore future warnings
|
| 20 |
warnings.simplefilter(action="ignore", category=FutureWarning)
|
|
|
|
| 1 |
import logging
|
| 2 |
import warnings
|
| 3 |
|
| 4 |
+
from marker.settings import settings
|
| 5 |
+
|
| 6 |
|
| 7 |
def configure_logging():
|
| 8 |
# Setup marker logger
|
| 9 |
+
logger = get_logger()
|
| 10 |
|
| 11 |
if not logger.handlers:
|
| 12 |
handler = logging.StreamHandler()
|
|
|
|
| 16 |
handler.setFormatter(formatter)
|
| 17 |
logger.addHandler(handler)
|
| 18 |
|
| 19 |
+
logger.setLevel(settings.LOGLEVEL)
|
| 20 |
|
| 21 |
# Ignore future warnings
|
| 22 |
warnings.simplefilter(action="ignore", category=FutureWarning)
|
marker/settings.py
CHANGED
|
@@ -16,6 +16,7 @@ class Settings(BaseSettings):
|
|
| 16 |
ARTIFACT_URL: str = "https://models.datalab.to/artifacts"
|
| 17 |
FONT_NAME: str = "GoNotoCurrent-Regular.ttf"
|
| 18 |
FONT_PATH: str = os.path.join(FONT_DIR, FONT_NAME)
|
|
|
|
| 19 |
|
| 20 |
# General
|
| 21 |
OUTPUT_ENCODING: str = "utf-8"
|
|
@@ -25,7 +26,9 @@ class Settings(BaseSettings):
|
|
| 25 |
GOOGLE_API_KEY: Optional[str] = ""
|
| 26 |
|
| 27 |
# General models
|
| 28 |
-
TORCH_DEVICE: Optional[str] =
|
|
|
|
|
|
|
| 29 |
|
| 30 |
@computed_field
|
| 31 |
@property
|
|
|
|
| 16 |
ARTIFACT_URL: str = "https://models.datalab.to/artifacts"
|
| 17 |
FONT_NAME: str = "GoNotoCurrent-Regular.ttf"
|
| 18 |
FONT_PATH: str = os.path.join(FONT_DIR, FONT_NAME)
|
| 19 |
+
LOGLEVEL: str = "INFO"
|
| 20 |
|
| 21 |
# General
|
| 22 |
OUTPUT_ENCODING: str = "utf-8"
|
|
|
|
| 26 |
GOOGLE_API_KEY: Optional[str] = ""
|
| 27 |
|
| 28 |
# General models
|
| 29 |
+
TORCH_DEVICE: Optional[str] = (
|
| 30 |
+
None # Note: MPS device does not work for text detection, and will default to CPU
|
| 31 |
+
)
|
| 32 |
|
| 33 |
@computed_field
|
| 34 |
@property
|
poetry.lock
CHANGED
|
@@ -3099,71 +3099,76 @@ files = [
|
|
| 3099 |
|
| 3100 |
[[package]]
|
| 3101 |
name = "nvidia-cublas-cu12"
|
| 3102 |
-
version = "12.4.
|
| 3103 |
description = "CUBLAS native runtime libraries"
|
| 3104 |
optional = false
|
| 3105 |
python-versions = ">=3"
|
| 3106 |
groups = ["main"]
|
| 3107 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3108 |
files = [
|
| 3109 |
-
{file = "nvidia_cublas_cu12-12.4.
|
| 3110 |
-
{file = "nvidia_cublas_cu12-12.4.
|
| 3111 |
-
{file = "nvidia_cublas_cu12-12.4.
|
| 3112 |
]
|
| 3113 |
|
| 3114 |
[[package]]
|
| 3115 |
name = "nvidia-cuda-cupti-cu12"
|
| 3116 |
-
version = "12.
|
| 3117 |
description = "CUDA profiling tools runtime libs."
|
| 3118 |
optional = false
|
| 3119 |
python-versions = ">=3"
|
| 3120 |
groups = ["main"]
|
| 3121 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3122 |
files = [
|
| 3123 |
-
{file = "nvidia_cuda_cupti_cu12-12.
|
| 3124 |
-
{file = "nvidia_cuda_cupti_cu12-12.
|
| 3125 |
-
{file = "nvidia_cuda_cupti_cu12-12.
|
|
|
|
|
|
|
| 3126 |
]
|
| 3127 |
|
| 3128 |
[[package]]
|
| 3129 |
name = "nvidia-cuda-nvrtc-cu12"
|
| 3130 |
-
version = "12.
|
| 3131 |
description = "NVRTC native runtime libraries"
|
| 3132 |
optional = false
|
| 3133 |
python-versions = ">=3"
|
| 3134 |
groups = ["main"]
|
| 3135 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3136 |
files = [
|
| 3137 |
-
{file = "nvidia_cuda_nvrtc_cu12-12.
|
| 3138 |
-
{file = "nvidia_cuda_nvrtc_cu12-12.
|
| 3139 |
-
{file = "nvidia_cuda_nvrtc_cu12-12.
|
| 3140 |
]
|
| 3141 |
|
| 3142 |
[[package]]
|
| 3143 |
name = "nvidia-cuda-runtime-cu12"
|
| 3144 |
-
version = "12.
|
| 3145 |
description = "CUDA Runtime native Libraries"
|
| 3146 |
optional = false
|
| 3147 |
python-versions = ">=3"
|
| 3148 |
groups = ["main"]
|
| 3149 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3150 |
files = [
|
| 3151 |
-
{file = "nvidia_cuda_runtime_cu12-12.
|
| 3152 |
-
{file = "nvidia_cuda_runtime_cu12-12.
|
| 3153 |
-
{file = "nvidia_cuda_runtime_cu12-12.
|
|
|
|
|
|
|
| 3154 |
]
|
| 3155 |
|
| 3156 |
[[package]]
|
| 3157 |
name = "nvidia-cudnn-cu12"
|
| 3158 |
-
version = "9.1.
|
| 3159 |
description = "cuDNN runtime libraries"
|
| 3160 |
optional = false
|
| 3161 |
python-versions = ">=3"
|
| 3162 |
groups = ["main"]
|
| 3163 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3164 |
files = [
|
| 3165 |
-
{file = "nvidia_cudnn_cu12-9.1.
|
| 3166 |
-
{file = "nvidia_cudnn_cu12-9.1.
|
|
|
|
| 3167 |
]
|
| 3168 |
|
| 3169 |
[package.dependencies]
|
|
@@ -3171,47 +3176,66 @@ nvidia-cublas-cu12 = "*"
|
|
| 3171 |
|
| 3172 |
[[package]]
|
| 3173 |
name = "nvidia-cufft-cu12"
|
| 3174 |
-
version = "11.
|
| 3175 |
description = "CUFFT native runtime libraries"
|
| 3176 |
optional = false
|
| 3177 |
python-versions = ">=3"
|
| 3178 |
groups = ["main"]
|
| 3179 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3180 |
files = [
|
| 3181 |
-
{file = "nvidia_cufft_cu12-11.
|
| 3182 |
-
{file = "nvidia_cufft_cu12-11.
|
| 3183 |
-
{file = "nvidia_cufft_cu12-11.
|
|
|
|
|
|
|
| 3184 |
]
|
| 3185 |
|
| 3186 |
[package.dependencies]
|
| 3187 |
nvidia-nvjitlink-cu12 = "*"
|
| 3188 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3189 |
[[package]]
|
| 3190 |
name = "nvidia-curand-cu12"
|
| 3191 |
-
version = "10.3.
|
| 3192 |
description = "CURAND native runtime libraries"
|
| 3193 |
optional = false
|
| 3194 |
python-versions = ">=3"
|
| 3195 |
groups = ["main"]
|
| 3196 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3197 |
files = [
|
| 3198 |
-
{file = "nvidia_curand_cu12-10.3.
|
| 3199 |
-
{file = "nvidia_curand_cu12-10.3.
|
| 3200 |
-
{file = "nvidia_curand_cu12-10.3.
|
|
|
|
|
|
|
| 3201 |
]
|
| 3202 |
|
| 3203 |
[[package]]
|
| 3204 |
name = "nvidia-cusolver-cu12"
|
| 3205 |
-
version = "11.
|
| 3206 |
description = "CUDA solver native runtime libraries"
|
| 3207 |
optional = false
|
| 3208 |
python-versions = ">=3"
|
| 3209 |
groups = ["main"]
|
| 3210 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3211 |
files = [
|
| 3212 |
-
{file = "nvidia_cusolver_cu12-11.
|
| 3213 |
-
{file = "nvidia_cusolver_cu12-11.
|
| 3214 |
-
{file = "nvidia_cusolver_cu12-11.
|
|
|
|
|
|
|
| 3215 |
]
|
| 3216 |
|
| 3217 |
[package.dependencies]
|
|
@@ -3221,16 +3245,18 @@ nvidia-nvjitlink-cu12 = "*"
|
|
| 3221 |
|
| 3222 |
[[package]]
|
| 3223 |
name = "nvidia-cusparse-cu12"
|
| 3224 |
-
version = "12.
|
| 3225 |
description = "CUSPARSE native runtime libraries"
|
| 3226 |
optional = false
|
| 3227 |
python-versions = ">=3"
|
| 3228 |
groups = ["main"]
|
| 3229 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3230 |
files = [
|
| 3231 |
-
{file = "nvidia_cusparse_cu12-12.
|
| 3232 |
-
{file = "nvidia_cusparse_cu12-12.
|
| 3233 |
-
{file = "nvidia_cusparse_cu12-12.
|
|
|
|
|
|
|
| 3234 |
]
|
| 3235 |
|
| 3236 |
[package.dependencies]
|
|
@@ -3238,56 +3264,59 @@ nvidia-nvjitlink-cu12 = "*"
|
|
| 3238 |
|
| 3239 |
[[package]]
|
| 3240 |
name = "nvidia-cusparselt-cu12"
|
| 3241 |
-
version = "0.6.
|
| 3242 |
description = "NVIDIA cuSPARSELt"
|
| 3243 |
optional = false
|
| 3244 |
python-versions = "*"
|
| 3245 |
groups = ["main"]
|
| 3246 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3247 |
files = [
|
| 3248 |
-
{file = "nvidia_cusparselt_cu12-0.6.
|
| 3249 |
-
{file = "nvidia_cusparselt_cu12-0.6.
|
| 3250 |
-
{file = "nvidia_cusparselt_cu12-0.6.
|
| 3251 |
]
|
| 3252 |
|
| 3253 |
[[package]]
|
| 3254 |
name = "nvidia-nccl-cu12"
|
| 3255 |
-
version = "2.
|
| 3256 |
description = "NVIDIA Collective Communication Library (NCCL) Runtime"
|
| 3257 |
optional = false
|
| 3258 |
python-versions = ">=3"
|
| 3259 |
groups = ["main"]
|
| 3260 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3261 |
files = [
|
| 3262 |
-
{file = "nvidia_nccl_cu12-2.
|
|
|
|
| 3263 |
]
|
| 3264 |
|
| 3265 |
[[package]]
|
| 3266 |
name = "nvidia-nvjitlink-cu12"
|
| 3267 |
-
version = "12.
|
| 3268 |
description = "Nvidia JIT LTO Library"
|
| 3269 |
optional = false
|
| 3270 |
python-versions = ">=3"
|
| 3271 |
groups = ["main"]
|
| 3272 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3273 |
files = [
|
| 3274 |
-
{file = "nvidia_nvjitlink_cu12-12.
|
| 3275 |
-
{file = "nvidia_nvjitlink_cu12-12.
|
| 3276 |
-
{file = "nvidia_nvjitlink_cu12-12.
|
| 3277 |
]
|
| 3278 |
|
| 3279 |
[[package]]
|
| 3280 |
name = "nvidia-nvtx-cu12"
|
| 3281 |
-
version = "12.
|
| 3282 |
description = "NVIDIA Tools Extension"
|
| 3283 |
optional = false
|
| 3284 |
python-versions = ">=3"
|
| 3285 |
groups = ["main"]
|
| 3286 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3287 |
files = [
|
| 3288 |
-
{file = "nvidia_nvtx_cu12-12.
|
| 3289 |
-
{file = "nvidia_nvtx_cu12-12.
|
| 3290 |
-
{file = "nvidia_nvtx_cu12-12.
|
|
|
|
|
|
|
| 3291 |
]
|
| 3292 |
|
| 3293 |
[[package]]
|
|
@@ -5206,7 +5235,7 @@ files = [
|
|
| 5206 |
{file = "setuptools-77.0.3-py3-none-any.whl", hash = "sha256:67122e78221da5cf550ddd04cf8742c8fe12094483749a792d56cd669d6cf58c"},
|
| 5207 |
{file = "setuptools-77.0.3.tar.gz", hash = "sha256:583b361c8da8de57403743e756609670de6fb2345920e36dc5c2d914c319c945"},
|
| 5208 |
]
|
| 5209 |
-
markers = {main = "python_version >= \"3.12\""}
|
| 5210 |
|
| 5211 |
[package.extras]
|
| 5212 |
check = ["pytest-checkdocs (>=2.4)", "pytest-ruff (>=0.2.1) ; sys_platform != \"cygwin\"", "ruff (>=0.8.0) ; sys_platform != \"cygwin\""]
|
|
@@ -5361,14 +5390,14 @@ snowflake = ["snowflake-connector-python (>=3.3.0) ; python_version < \"3.12\"",
|
|
| 5361 |
|
| 5362 |
[[package]]
|
| 5363 |
name = "surya-ocr"
|
| 5364 |
-
version = "0.14.
|
| 5365 |
description = "OCR, layout, reading order, and table recognition in 90+ languages"
|
| 5366 |
optional = false
|
| 5367 |
python-versions = "<4.0,>=3.10"
|
| 5368 |
groups = ["main"]
|
| 5369 |
files = [
|
| 5370 |
-
{file = "surya_ocr-0.14.
|
| 5371 |
-
{file = "surya_ocr-0.14.
|
| 5372 |
]
|
| 5373 |
|
| 5374 |
[package.dependencies]
|
|
@@ -5383,19 +5412,19 @@ pydantic = ">=2.5.3,<3.0.0"
|
|
| 5383 |
pydantic-settings = ">=2.1.0,<3.0.0"
|
| 5384 |
pypdfium2 = "4.30.0"
|
| 5385 |
python-dotenv = ">=1.0.0,<2.0.0"
|
| 5386 |
-
torch = ">=2.
|
| 5387 |
transformers = ">=4.51.2,<5.0.0"
|
| 5388 |
|
| 5389 |
[[package]]
|
| 5390 |
name = "sympy"
|
| 5391 |
-
version = "1.
|
| 5392 |
description = "Computer algebra system (CAS) in Python"
|
| 5393 |
optional = false
|
| 5394 |
-
python-versions = ">=3.
|
| 5395 |
groups = ["main"]
|
| 5396 |
files = [
|
| 5397 |
-
{file = "sympy-1.
|
| 5398 |
-
{file = "sympy-1.
|
| 5399 |
]
|
| 5400 |
|
| 5401 |
[package.dependencies]
|
|
@@ -5599,32 +5628,36 @@ files = [
|
|
| 5599 |
|
| 5600 |
[[package]]
|
| 5601 |
name = "torch"
|
| 5602 |
-
version = "2.
|
| 5603 |
description = "Tensors and Dynamic neural networks in Python with strong GPU acceleration"
|
| 5604 |
optional = false
|
| 5605 |
python-versions = ">=3.9.0"
|
| 5606 |
groups = ["main"]
|
| 5607 |
files = [
|
| 5608 |
-
{file = "torch-2.
|
| 5609 |
-
{file = "torch-2.
|
| 5610 |
-
{file = "torch-2.
|
| 5611 |
-
{file = "torch-2.
|
| 5612 |
-
{file = "torch-2.
|
| 5613 |
-
{file = "torch-2.
|
| 5614 |
-
{file = "torch-2.
|
| 5615 |
-
{file = "torch-2.
|
| 5616 |
-
{file = "torch-2.
|
| 5617 |
-
{file = "torch-2.
|
| 5618 |
-
{file = "torch-2.
|
| 5619 |
-
{file = "torch-2.
|
| 5620 |
-
{file = "torch-2.
|
| 5621 |
-
{file = "torch-2.
|
| 5622 |
-
{file = "torch-2.
|
| 5623 |
-
{file = "torch-2.
|
| 5624 |
-
{file = "torch-2.
|
| 5625 |
-
{file = "torch-2.
|
| 5626 |
-
{file = "torch-2.
|
| 5627 |
-
{file = "torch-2.
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5628 |
]
|
| 5629 |
|
| 5630 |
[package.dependencies]
|
|
@@ -5632,22 +5665,23 @@ filelock = "*"
|
|
| 5632 |
fsspec = "*"
|
| 5633 |
jinja2 = "*"
|
| 5634 |
networkx = "*"
|
| 5635 |
-
nvidia-cublas-cu12 = {version = "12.4.
|
| 5636 |
-
nvidia-cuda-cupti-cu12 = {version = "12.
|
| 5637 |
-
nvidia-cuda-nvrtc-cu12 = {version = "12.
|
| 5638 |
-
nvidia-cuda-runtime-cu12 = {version = "12.
|
| 5639 |
-
nvidia-cudnn-cu12 = {version = "9.1.
|
| 5640 |
-
nvidia-cufft-cu12 = {version = "11.
|
| 5641 |
-
nvidia-
|
| 5642 |
-
nvidia-
|
| 5643 |
-
nvidia-
|
| 5644 |
-
nvidia-
|
| 5645 |
-
nvidia-
|
| 5646 |
-
nvidia-
|
| 5647 |
-
nvidia-
|
|
|
|
| 5648 |
setuptools = {version = "*", markers = "python_version >= \"3.12\""}
|
| 5649 |
-
sympy =
|
| 5650 |
-
triton = {version = "3.
|
| 5651 |
typing-extensions = ">=4.10.0"
|
| 5652 |
|
| 5653 |
[package.extras]
|
|
@@ -5788,23 +5822,27 @@ vision = ["Pillow (>=10.0.1,<=15.0)"]
|
|
| 5788 |
|
| 5789 |
[[package]]
|
| 5790 |
name = "triton"
|
| 5791 |
-
version = "3.
|
| 5792 |
description = "A language and compiler for custom Deep Learning operations"
|
| 5793 |
optional = false
|
| 5794 |
python-versions = "*"
|
| 5795 |
groups = ["main"]
|
| 5796 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 5797 |
files = [
|
| 5798 |
-
{file = "triton-3.
|
| 5799 |
-
{file = "triton-3.
|
| 5800 |
-
{file = "triton-3.
|
| 5801 |
-
{file = "triton-3.
|
| 5802 |
-
{file = "triton-3.
|
|
|
|
| 5803 |
]
|
| 5804 |
|
|
|
|
|
|
|
|
|
|
| 5805 |
[package.extras]
|
| 5806 |
build = ["cmake (>=3.20)", "lit"]
|
| 5807 |
-
tests = ["autopep8", "
|
| 5808 |
tutorials = ["matplotlib", "pandas", "tabulate"]
|
| 5809 |
|
| 5810 |
[[package]]
|
|
@@ -6467,4 +6505,4 @@ full = ["ebooklib", "mammoth", "openpyxl", "python-pptx", "weasyprint"]
|
|
| 6467 |
[metadata]
|
| 6468 |
lock-version = "2.1"
|
| 6469 |
python-versions = "^3.10"
|
| 6470 |
-
content-hash = "
|
|
|
|
| 3099 |
|
| 3100 |
[[package]]
|
| 3101 |
name = "nvidia-cublas-cu12"
|
| 3102 |
+
version = "12.6.4.1"
|
| 3103 |
description = "CUBLAS native runtime libraries"
|
| 3104 |
optional = false
|
| 3105 |
python-versions = ">=3"
|
| 3106 |
groups = ["main"]
|
| 3107 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3108 |
files = [
|
| 3109 |
+
{file = "nvidia_cublas_cu12-12.6.4.1-py3-none-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:08ed2686e9875d01b58e3cb379c6896df8e76c75e0d4a7f7dace3d7b6d9ef8eb"},
|
| 3110 |
+
{file = "nvidia_cublas_cu12-12.6.4.1-py3-none-manylinux_2_27_aarch64.whl", hash = "sha256:235f728d6e2a409eddf1df58d5b0921cf80cfa9e72b9f2775ccb7b4a87984668"},
|
| 3111 |
+
{file = "nvidia_cublas_cu12-12.6.4.1-py3-none-win_amd64.whl", hash = "sha256:9e4fa264f4d8a4eb0cdbd34beadc029f453b3bafae02401e999cf3d5a5af75f8"},
|
| 3112 |
]
|
| 3113 |
|
| 3114 |
[[package]]
|
| 3115 |
name = "nvidia-cuda-cupti-cu12"
|
| 3116 |
+
version = "12.6.80"
|
| 3117 |
description = "CUDA profiling tools runtime libs."
|
| 3118 |
optional = false
|
| 3119 |
python-versions = ">=3"
|
| 3120 |
groups = ["main"]
|
| 3121 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3122 |
files = [
|
| 3123 |
+
{file = "nvidia_cuda_cupti_cu12-12.6.80-py3-none-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:166ee35a3ff1587f2490364f90eeeb8da06cd867bd5b701bf7f9a02b78bc63fc"},
|
| 3124 |
+
{file = "nvidia_cuda_cupti_cu12-12.6.80-py3-none-manylinux2014_aarch64.whl", hash = "sha256:358b4a1d35370353d52e12f0a7d1769fc01ff74a191689d3870b2123156184c4"},
|
| 3125 |
+
{file = "nvidia_cuda_cupti_cu12-12.6.80-py3-none-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:6768bad6cab4f19e8292125e5f1ac8aa7d1718704012a0e3272a6f61c4bce132"},
|
| 3126 |
+
{file = "nvidia_cuda_cupti_cu12-12.6.80-py3-none-manylinux2014_x86_64.whl", hash = "sha256:a3eff6cdfcc6a4c35db968a06fcadb061cbc7d6dde548609a941ff8701b98b73"},
|
| 3127 |
+
{file = "nvidia_cuda_cupti_cu12-12.6.80-py3-none-win_amd64.whl", hash = "sha256:bbe6ae76e83ce5251b56e8c8e61a964f757175682bbad058b170b136266ab00a"},
|
| 3128 |
]
|
| 3129 |
|
| 3130 |
[[package]]
|
| 3131 |
name = "nvidia-cuda-nvrtc-cu12"
|
| 3132 |
+
version = "12.6.77"
|
| 3133 |
description = "NVRTC native runtime libraries"
|
| 3134 |
optional = false
|
| 3135 |
python-versions = ">=3"
|
| 3136 |
groups = ["main"]
|
| 3137 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3138 |
files = [
|
| 3139 |
+
{file = "nvidia_cuda_nvrtc_cu12-12.6.77-py3-none-manylinux2014_aarch64.whl", hash = "sha256:5847f1d6e5b757f1d2b3991a01082a44aad6f10ab3c5c0213fa3e25bddc25a13"},
|
| 3140 |
+
{file = "nvidia_cuda_nvrtc_cu12-12.6.77-py3-none-manylinux2014_x86_64.whl", hash = "sha256:35b0cc6ee3a9636d5409133e79273ce1f3fd087abb0532d2d2e8fff1fe9efc53"},
|
| 3141 |
+
{file = "nvidia_cuda_nvrtc_cu12-12.6.77-py3-none-win_amd64.whl", hash = "sha256:f7007dbd914c56bd80ea31bc43e8e149da38f68158f423ba845fc3292684e45a"},
|
| 3142 |
]
|
| 3143 |
|
| 3144 |
[[package]]
|
| 3145 |
name = "nvidia-cuda-runtime-cu12"
|
| 3146 |
+
version = "12.6.77"
|
| 3147 |
description = "CUDA Runtime native Libraries"
|
| 3148 |
optional = false
|
| 3149 |
python-versions = ">=3"
|
| 3150 |
groups = ["main"]
|
| 3151 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3152 |
files = [
|
| 3153 |
+
{file = "nvidia_cuda_runtime_cu12-12.6.77-py3-none-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:6116fad3e049e04791c0256a9778c16237837c08b27ed8c8401e2e45de8d60cd"},
|
| 3154 |
+
{file = "nvidia_cuda_runtime_cu12-12.6.77-py3-none-manylinux2014_aarch64.whl", hash = "sha256:d461264ecb429c84c8879a7153499ddc7b19b5f8d84c204307491989a365588e"},
|
| 3155 |
+
{file = "nvidia_cuda_runtime_cu12-12.6.77-py3-none-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:ba3b56a4f896141e25e19ab287cd71e52a6a0f4b29d0d31609f60e3b4d5219b7"},
|
| 3156 |
+
{file = "nvidia_cuda_runtime_cu12-12.6.77-py3-none-manylinux2014_x86_64.whl", hash = "sha256:a84d15d5e1da416dd4774cb42edf5e954a3e60cc945698dc1d5be02321c44dc8"},
|
| 3157 |
+
{file = "nvidia_cuda_runtime_cu12-12.6.77-py3-none-win_amd64.whl", hash = "sha256:86c58044c824bf3c173c49a2dbc7a6c8b53cb4e4dca50068be0bf64e9dab3f7f"},
|
| 3158 |
]
|
| 3159 |
|
| 3160 |
[[package]]
|
| 3161 |
name = "nvidia-cudnn-cu12"
|
| 3162 |
+
version = "9.5.1.17"
|
| 3163 |
description = "cuDNN runtime libraries"
|
| 3164 |
optional = false
|
| 3165 |
python-versions = ">=3"
|
| 3166 |
groups = ["main"]
|
| 3167 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3168 |
files = [
|
| 3169 |
+
{file = "nvidia_cudnn_cu12-9.5.1.17-py3-none-manylinux_2_28_aarch64.whl", hash = "sha256:9fd4584468533c61873e5fda8ca41bac3a38bcb2d12350830c69b0a96a7e4def"},
|
| 3170 |
+
{file = "nvidia_cudnn_cu12-9.5.1.17-py3-none-manylinux_2_28_x86_64.whl", hash = "sha256:30ac3869f6db17d170e0e556dd6cc5eee02647abc31ca856634d5a40f82c15b2"},
|
| 3171 |
+
{file = "nvidia_cudnn_cu12-9.5.1.17-py3-none-win_amd64.whl", hash = "sha256:d7af0f8a4f3b4b9dbb3122f2ef553b45694ed9c384d5a75bab197b8eefb79ab8"},
|
| 3172 |
]
|
| 3173 |
|
| 3174 |
[package.dependencies]
|
|
|
|
| 3176 |
|
| 3177 |
[[package]]
|
| 3178 |
name = "nvidia-cufft-cu12"
|
| 3179 |
+
version = "11.3.0.4"
|
| 3180 |
description = "CUFFT native runtime libraries"
|
| 3181 |
optional = false
|
| 3182 |
python-versions = ">=3"
|
| 3183 |
groups = ["main"]
|
| 3184 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3185 |
files = [
|
| 3186 |
+
{file = "nvidia_cufft_cu12-11.3.0.4-py3-none-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:d16079550df460376455cba121db6564089176d9bac9e4f360493ca4741b22a6"},
|
| 3187 |
+
{file = "nvidia_cufft_cu12-11.3.0.4-py3-none-manylinux2014_aarch64.whl", hash = "sha256:8510990de9f96c803a051822618d42bf6cb8f069ff3f48d93a8486efdacb48fb"},
|
| 3188 |
+
{file = "nvidia_cufft_cu12-11.3.0.4-py3-none-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:ccba62eb9cef5559abd5e0d54ceed2d9934030f51163df018532142a8ec533e5"},
|
| 3189 |
+
{file = "nvidia_cufft_cu12-11.3.0.4-py3-none-manylinux2014_x86_64.whl", hash = "sha256:768160ac89f6f7b459bee747e8d175dbf53619cfe74b2a5636264163138013ca"},
|
| 3190 |
+
{file = "nvidia_cufft_cu12-11.3.0.4-py3-none-win_amd64.whl", hash = "sha256:6048ebddfb90d09d2707efb1fd78d4e3a77cb3ae4dc60e19aab6be0ece2ae464"},
|
| 3191 |
]
|
| 3192 |
|
| 3193 |
[package.dependencies]
|
| 3194 |
nvidia-nvjitlink-cu12 = "*"
|
| 3195 |
|
| 3196 |
+
[[package]]
|
| 3197 |
+
name = "nvidia-cufile-cu12"
|
| 3198 |
+
version = "1.11.1.6"
|
| 3199 |
+
description = "cuFile GPUDirect libraries"
|
| 3200 |
+
optional = false
|
| 3201 |
+
python-versions = ">=3"
|
| 3202 |
+
groups = ["main"]
|
| 3203 |
+
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3204 |
+
files = [
|
| 3205 |
+
{file = "nvidia_cufile_cu12-1.11.1.6-py3-none-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:cc23469d1c7e52ce6c1d55253273d32c565dd22068647f3aa59b3c6b005bf159"},
|
| 3206 |
+
{file = "nvidia_cufile_cu12-1.11.1.6-py3-none-manylinux_2_27_aarch64.whl", hash = "sha256:8f57a0051dcf2543f6dc2b98a98cb2719c37d3cee1baba8965d57f3bbc90d4db"},
|
| 3207 |
+
]
|
| 3208 |
+
|
| 3209 |
[[package]]
|
| 3210 |
name = "nvidia-curand-cu12"
|
| 3211 |
+
version = "10.3.7.77"
|
| 3212 |
description = "CURAND native runtime libraries"
|
| 3213 |
optional = false
|
| 3214 |
python-versions = ">=3"
|
| 3215 |
groups = ["main"]
|
| 3216 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3217 |
files = [
|
| 3218 |
+
{file = "nvidia_curand_cu12-10.3.7.77-py3-none-manylinux2014_aarch64.whl", hash = "sha256:6e82df077060ea28e37f48a3ec442a8f47690c7499bff392a5938614b56c98d8"},
|
| 3219 |
+
{file = "nvidia_curand_cu12-10.3.7.77-py3-none-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:a42cd1344297f70b9e39a1e4f467a4e1c10f1da54ff7a85c12197f6c652c8bdf"},
|
| 3220 |
+
{file = "nvidia_curand_cu12-10.3.7.77-py3-none-manylinux2014_x86_64.whl", hash = "sha256:99f1a32f1ac2bd134897fc7a203f779303261268a65762a623bf30cc9fe79117"},
|
| 3221 |
+
{file = "nvidia_curand_cu12-10.3.7.77-py3-none-manylinux_2_27_aarch64.whl", hash = "sha256:7b2ed8e95595c3591d984ea3603dd66fe6ce6812b886d59049988a712ed06b6e"},
|
| 3222 |
+
{file = "nvidia_curand_cu12-10.3.7.77-py3-none-win_amd64.whl", hash = "sha256:6d6d935ffba0f3d439b7cd968192ff068fafd9018dbf1b85b37261b13cfc9905"},
|
| 3223 |
]
|
| 3224 |
|
| 3225 |
[[package]]
|
| 3226 |
name = "nvidia-cusolver-cu12"
|
| 3227 |
+
version = "11.7.1.2"
|
| 3228 |
description = "CUDA solver native runtime libraries"
|
| 3229 |
optional = false
|
| 3230 |
python-versions = ">=3"
|
| 3231 |
groups = ["main"]
|
| 3232 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3233 |
files = [
|
| 3234 |
+
{file = "nvidia_cusolver_cu12-11.7.1.2-py3-none-manylinux2014_aarch64.whl", hash = "sha256:0ce237ef60acde1efc457335a2ddadfd7610b892d94efee7b776c64bb1cac9e0"},
|
| 3235 |
+
{file = "nvidia_cusolver_cu12-11.7.1.2-py3-none-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:e9e49843a7707e42022babb9bcfa33c29857a93b88020c4e4434656a655b698c"},
|
| 3236 |
+
{file = "nvidia_cusolver_cu12-11.7.1.2-py3-none-manylinux2014_x86_64.whl", hash = "sha256:6cf28f17f64107a0c4d7802be5ff5537b2130bfc112f25d5a30df227058ca0e6"},
|
| 3237 |
+
{file = "nvidia_cusolver_cu12-11.7.1.2-py3-none-manylinux_2_27_aarch64.whl", hash = "sha256:dbbe4fc38ec1289c7e5230e16248365e375c3673c9c8bac5796e2e20db07f56e"},
|
| 3238 |
+
{file = "nvidia_cusolver_cu12-11.7.1.2-py3-none-win_amd64.whl", hash = "sha256:6813f9d8073f555444a8705f3ab0296d3e1cb37a16d694c5fc8b862a0d8706d7"},
|
| 3239 |
]
|
| 3240 |
|
| 3241 |
[package.dependencies]
|
|
|
|
| 3245 |
|
| 3246 |
[[package]]
|
| 3247 |
name = "nvidia-cusparse-cu12"
|
| 3248 |
+
version = "12.5.4.2"
|
| 3249 |
description = "CUSPARSE native runtime libraries"
|
| 3250 |
optional = false
|
| 3251 |
python-versions = ">=3"
|
| 3252 |
groups = ["main"]
|
| 3253 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3254 |
files = [
|
| 3255 |
+
{file = "nvidia_cusparse_cu12-12.5.4.2-py3-none-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:d25b62fb18751758fe3c93a4a08eff08effedfe4edf1c6bb5afd0890fe88f887"},
|
| 3256 |
+
{file = "nvidia_cusparse_cu12-12.5.4.2-py3-none-manylinux2014_aarch64.whl", hash = "sha256:7aa32fa5470cf754f72d1116c7cbc300b4e638d3ae5304cfa4a638a5b87161b1"},
|
| 3257 |
+
{file = "nvidia_cusparse_cu12-12.5.4.2-py3-none-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:7556d9eca156e18184b94947ade0fba5bb47d69cec46bf8660fd2c71a4b48b73"},
|
| 3258 |
+
{file = "nvidia_cusparse_cu12-12.5.4.2-py3-none-manylinux2014_x86_64.whl", hash = "sha256:23749a6571191a215cb74d1cdbff4a86e7b19f1200c071b3fcf844a5bea23a2f"},
|
| 3259 |
+
{file = "nvidia_cusparse_cu12-12.5.4.2-py3-none-win_amd64.whl", hash = "sha256:4acb8c08855a26d737398cba8fb6f8f5045d93f82612b4cfd84645a2332ccf20"},
|
| 3260 |
]
|
| 3261 |
|
| 3262 |
[package.dependencies]
|
|
|
|
| 3264 |
|
| 3265 |
[[package]]
|
| 3266 |
name = "nvidia-cusparselt-cu12"
|
| 3267 |
+
version = "0.6.3"
|
| 3268 |
description = "NVIDIA cuSPARSELt"
|
| 3269 |
optional = false
|
| 3270 |
python-versions = "*"
|
| 3271 |
groups = ["main"]
|
| 3272 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3273 |
files = [
|
| 3274 |
+
{file = "nvidia_cusparselt_cu12-0.6.3-py3-none-manylinux2014_aarch64.whl", hash = "sha256:8371549623ba601a06322af2133c4a44350575f5a3108fb75f3ef20b822ad5f1"},
|
| 3275 |
+
{file = "nvidia_cusparselt_cu12-0.6.3-py3-none-manylinux2014_x86_64.whl", hash = "sha256:e5c8a26c36445dd2e6812f1177978a24e2d37cacce7e090f297a688d1ec44f46"},
|
| 3276 |
+
{file = "nvidia_cusparselt_cu12-0.6.3-py3-none-win_amd64.whl", hash = "sha256:3b325bcbd9b754ba43df5a311488fca11a6b5dc3d11df4d190c000cf1a0765c7"},
|
| 3277 |
]
|
| 3278 |
|
| 3279 |
[[package]]
|
| 3280 |
name = "nvidia-nccl-cu12"
|
| 3281 |
+
version = "2.26.2"
|
| 3282 |
description = "NVIDIA Collective Communication Library (NCCL) Runtime"
|
| 3283 |
optional = false
|
| 3284 |
python-versions = ">=3"
|
| 3285 |
groups = ["main"]
|
| 3286 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3287 |
files = [
|
| 3288 |
+
{file = "nvidia_nccl_cu12-2.26.2-py3-none-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:5c196e95e832ad30fbbb50381eb3cbd1fadd5675e587a548563993609af19522"},
|
| 3289 |
+
{file = "nvidia_nccl_cu12-2.26.2-py3-none-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:694cf3879a206553cc9d7dbda76b13efaf610fdb70a50cba303de1b0d1530ac6"},
|
| 3290 |
]
|
| 3291 |
|
| 3292 |
[[package]]
|
| 3293 |
name = "nvidia-nvjitlink-cu12"
|
| 3294 |
+
version = "12.6.85"
|
| 3295 |
description = "Nvidia JIT LTO Library"
|
| 3296 |
optional = false
|
| 3297 |
python-versions = ">=3"
|
| 3298 |
groups = ["main"]
|
| 3299 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3300 |
files = [
|
| 3301 |
+
{file = "nvidia_nvjitlink_cu12-12.6.85-py3-none-manylinux2010_x86_64.manylinux_2_12_x86_64.whl", hash = "sha256:eedc36df9e88b682efe4309aa16b5b4e78c2407eac59e8c10a6a47535164369a"},
|
| 3302 |
+
{file = "nvidia_nvjitlink_cu12-12.6.85-py3-none-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:cf4eaa7d4b6b543ffd69d6abfb11efdeb2db48270d94dfd3a452c24150829e41"},
|
| 3303 |
+
{file = "nvidia_nvjitlink_cu12-12.6.85-py3-none-win_amd64.whl", hash = "sha256:e61120e52ed675747825cdd16febc6a0730537451d867ee58bee3853b1b13d1c"},
|
| 3304 |
]
|
| 3305 |
|
| 3306 |
[[package]]
|
| 3307 |
name = "nvidia-nvtx-cu12"
|
| 3308 |
+
version = "12.6.77"
|
| 3309 |
description = "NVIDIA Tools Extension"
|
| 3310 |
optional = false
|
| 3311 |
python-versions = ">=3"
|
| 3312 |
groups = ["main"]
|
| 3313 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 3314 |
files = [
|
| 3315 |
+
{file = "nvidia_nvtx_cu12-12.6.77-py3-none-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:f44f8d86bb7d5629988d61c8d3ae61dddb2015dee142740536bc7481b022fe4b"},
|
| 3316 |
+
{file = "nvidia_nvtx_cu12-12.6.77-py3-none-manylinux2014_aarch64.whl", hash = "sha256:adcaabb9d436c9761fca2b13959a2d237c5f9fd406c8e4b723c695409ff88059"},
|
| 3317 |
+
{file = "nvidia_nvtx_cu12-12.6.77-py3-none-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:b90bed3df379fa79afbd21be8e04a0314336b8ae16768b58f2d34cb1d04cd7d2"},
|
| 3318 |
+
{file = "nvidia_nvtx_cu12-12.6.77-py3-none-manylinux2014_x86_64.whl", hash = "sha256:6574241a3ec5fdc9334353ab8c479fe75841dbe8f4532a8fc97ce63503330ba1"},
|
| 3319 |
+
{file = "nvidia_nvtx_cu12-12.6.77-py3-none-win_amd64.whl", hash = "sha256:2fb11a4af04a5e6c84073e6404d26588a34afd35379f0855a99797897efa75c0"},
|
| 3320 |
]
|
| 3321 |
|
| 3322 |
[[package]]
|
|
|
|
| 5235 |
{file = "setuptools-77.0.3-py3-none-any.whl", hash = "sha256:67122e78221da5cf550ddd04cf8742c8fe12094483749a792d56cd669d6cf58c"},
|
| 5236 |
{file = "setuptools-77.0.3.tar.gz", hash = "sha256:583b361c8da8de57403743e756609670de6fb2345920e36dc5c2d914c319c945"},
|
| 5237 |
]
|
| 5238 |
+
markers = {main = "platform_system == \"Linux\" and platform_machine == \"x86_64\" or python_version >= \"3.12\""}
|
| 5239 |
|
| 5240 |
[package.extras]
|
| 5241 |
check = ["pytest-checkdocs (>=2.4)", "pytest-ruff (>=0.2.1) ; sys_platform != \"cygwin\"", "ruff (>=0.8.0) ; sys_platform != \"cygwin\""]
|
|
|
|
| 5390 |
|
| 5391 |
[[package]]
|
| 5392 |
name = "surya-ocr"
|
| 5393 |
+
version = "0.14.2"
|
| 5394 |
description = "OCR, layout, reading order, and table recognition in 90+ languages"
|
| 5395 |
optional = false
|
| 5396 |
python-versions = "<4.0,>=3.10"
|
| 5397 |
groups = ["main"]
|
| 5398 |
files = [
|
| 5399 |
+
{file = "surya_ocr-0.14.2-py3-none-any.whl", hash = "sha256:0c402705c860f8bf98fc2bf2a3b49d7f0e16fba587aed6d3f01bb53bb776d283"},
|
| 5400 |
+
{file = "surya_ocr-0.14.2.tar.gz", hash = "sha256:852af681073167beba9a638658c70b81318f1a8f3d558db68dead1b2c391e862"},
|
| 5401 |
]
|
| 5402 |
|
| 5403 |
[package.dependencies]
|
|
|
|
| 5412 |
pydantic-settings = ">=2.1.0,<3.0.0"
|
| 5413 |
pypdfium2 = "4.30.0"
|
| 5414 |
python-dotenv = ">=1.0.0,<2.0.0"
|
| 5415 |
+
torch = ">=2.7.0,<3.0.0"
|
| 5416 |
transformers = ">=4.51.2,<5.0.0"
|
| 5417 |
|
| 5418 |
[[package]]
|
| 5419 |
name = "sympy"
|
| 5420 |
+
version = "1.14.0"
|
| 5421 |
description = "Computer algebra system (CAS) in Python"
|
| 5422 |
optional = false
|
| 5423 |
+
python-versions = ">=3.9"
|
| 5424 |
groups = ["main"]
|
| 5425 |
files = [
|
| 5426 |
+
{file = "sympy-1.14.0-py3-none-any.whl", hash = "sha256:e091cc3e99d2141a0ba2847328f5479b05d94a6635cb96148ccb3f34671bd8f5"},
|
| 5427 |
+
{file = "sympy-1.14.0.tar.gz", hash = "sha256:d3d3fe8df1e5a0b42f0e7bdf50541697dbe7d23746e894990c030e2b05e72517"},
|
| 5428 |
]
|
| 5429 |
|
| 5430 |
[package.dependencies]
|
|
|
|
| 5628 |
|
| 5629 |
[[package]]
|
| 5630 |
name = "torch"
|
| 5631 |
+
version = "2.7.0"
|
| 5632 |
description = "Tensors and Dynamic neural networks in Python with strong GPU acceleration"
|
| 5633 |
optional = false
|
| 5634 |
python-versions = ">=3.9.0"
|
| 5635 |
groups = ["main"]
|
| 5636 |
files = [
|
| 5637 |
+
{file = "torch-2.7.0-cp310-cp310-manylinux_2_28_aarch64.whl", hash = "sha256:c9afea41b11e1a1ab1b258a5c31afbd646d6319042bfe4f231b408034b51128b"},
|
| 5638 |
+
{file = "torch-2.7.0-cp310-cp310-manylinux_2_28_x86_64.whl", hash = "sha256:0b9960183b6e5b71239a3e6c883d8852c304e691c0b2955f7045e8a6d05b9183"},
|
| 5639 |
+
{file = "torch-2.7.0-cp310-cp310-win_amd64.whl", hash = "sha256:2ad79d0d8c2a20a37c5df6052ec67c2078a2c4e9a96dd3a8b55daaff6d28ea29"},
|
| 5640 |
+
{file = "torch-2.7.0-cp310-none-macosx_11_0_arm64.whl", hash = "sha256:34e0168ed6de99121612d72224e59b2a58a83dae64999990eada7260c5dd582d"},
|
| 5641 |
+
{file = "torch-2.7.0-cp311-cp311-manylinux_2_28_aarch64.whl", hash = "sha256:2b7813e904757b125faf1a9a3154e1d50381d539ced34da1992f52440567c156"},
|
| 5642 |
+
{file = "torch-2.7.0-cp311-cp311-manylinux_2_28_x86_64.whl", hash = "sha256:fd5cfbb4c3bbadd57ad1b27d56a28008f8d8753733411a140fcfb84d7f933a25"},
|
| 5643 |
+
{file = "torch-2.7.0-cp311-cp311-win_amd64.whl", hash = "sha256:58df8d5c2eeb81305760282b5069ea4442791a6bbf0c74d9069b7b3304ff8a37"},
|
| 5644 |
+
{file = "torch-2.7.0-cp311-none-macosx_11_0_arm64.whl", hash = "sha256:0a8d43caa342b9986101ec5feb5bbf1d86570b5caa01e9cb426378311258fdde"},
|
| 5645 |
+
{file = "torch-2.7.0-cp312-cp312-manylinux_2_28_aarch64.whl", hash = "sha256:36a6368c7ace41ad1c0f69f18056020b6a5ca47bedaca9a2f3b578f5a104c26c"},
|
| 5646 |
+
{file = "torch-2.7.0-cp312-cp312-manylinux_2_28_x86_64.whl", hash = "sha256:15aab3e31c16feb12ae0a88dba3434a458874636f360c567caa6a91f6bfba481"},
|
| 5647 |
+
{file = "torch-2.7.0-cp312-cp312-win_amd64.whl", hash = "sha256:f56d4b2510934e072bab3ab8987e00e60e1262fb238176168f5e0c43a1320c6d"},
|
| 5648 |
+
{file = "torch-2.7.0-cp312-none-macosx_11_0_arm64.whl", hash = "sha256:30b7688a87239a7de83f269333651d8e582afffce6f591fff08c046f7787296e"},
|
| 5649 |
+
{file = "torch-2.7.0-cp313-cp313-manylinux_2_28_aarch64.whl", hash = "sha256:868ccdc11798535b5727509480cd1d86d74220cfdc42842c4617338c1109a205"},
|
| 5650 |
+
{file = "torch-2.7.0-cp313-cp313-manylinux_2_28_x86_64.whl", hash = "sha256:9b52347118116cf3dff2ab5a3c3dd97c719eb924ac658ca2a7335652076df708"},
|
| 5651 |
+
{file = "torch-2.7.0-cp313-cp313-win_amd64.whl", hash = "sha256:434cf3b378340efc87c758f250e884f34460624c0523fe5c9b518d205c91dd1b"},
|
| 5652 |
+
{file = "torch-2.7.0-cp313-cp313t-macosx_14_0_arm64.whl", hash = "sha256:edad98dddd82220465b106506bb91ee5ce32bd075cddbcf2b443dfaa2cbd83bf"},
|
| 5653 |
+
{file = "torch-2.7.0-cp313-cp313t-manylinux_2_28_aarch64.whl", hash = "sha256:2a885fc25afefb6e6eb18a7d1e8bfa01cc153e92271d980a49243b250d5ab6d9"},
|
| 5654 |
+
{file = "torch-2.7.0-cp313-cp313t-manylinux_2_28_x86_64.whl", hash = "sha256:176300ff5bc11a5f5b0784e40bde9e10a35c4ae9609beed96b4aeb46a27f5fae"},
|
| 5655 |
+
{file = "torch-2.7.0-cp313-cp313t-win_amd64.whl", hash = "sha256:d0ca446a93f474985d81dc866fcc8dccefb9460a29a456f79d99c29a78a66993"},
|
| 5656 |
+
{file = "torch-2.7.0-cp313-none-macosx_11_0_arm64.whl", hash = "sha256:27f5007bdf45f7bb7af7f11d1828d5c2487e030690afb3d89a651fd7036a390e"},
|
| 5657 |
+
{file = "torch-2.7.0-cp39-cp39-manylinux_2_28_aarch64.whl", hash = "sha256:e362efaa5b3078e5f75c33efc05005b9b46de0d2e899519d5b4cad0e050ed0f7"},
|
| 5658 |
+
{file = "torch-2.7.0-cp39-cp39-manylinux_2_28_x86_64.whl", hash = "sha256:fc1ed9258cbfce69970ff508ea60881818d414d098a800b7695ba36f570d34b0"},
|
| 5659 |
+
{file = "torch-2.7.0-cp39-cp39-win_amd64.whl", hash = "sha256:87b0802cab44659fcb6bcf5678d58fa4a8b48561cde8fb2d317edf0b6990e1bb"},
|
| 5660 |
+
{file = "torch-2.7.0-cp39-none-macosx_11_0_arm64.whl", hash = "sha256:ccd7509141713997861b7a947ef0a717143cd7e9240addd168f38ba8fd23fd56"},
|
| 5661 |
]
|
| 5662 |
|
| 5663 |
[package.dependencies]
|
|
|
|
| 5665 |
fsspec = "*"
|
| 5666 |
jinja2 = "*"
|
| 5667 |
networkx = "*"
|
| 5668 |
+
nvidia-cublas-cu12 = {version = "12.6.4.1", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
|
| 5669 |
+
nvidia-cuda-cupti-cu12 = {version = "12.6.80", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
|
| 5670 |
+
nvidia-cuda-nvrtc-cu12 = {version = "12.6.77", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
|
| 5671 |
+
nvidia-cuda-runtime-cu12 = {version = "12.6.77", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
|
| 5672 |
+
nvidia-cudnn-cu12 = {version = "9.5.1.17", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
|
| 5673 |
+
nvidia-cufft-cu12 = {version = "11.3.0.4", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
|
| 5674 |
+
nvidia-cufile-cu12 = {version = "1.11.1.6", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
|
| 5675 |
+
nvidia-curand-cu12 = {version = "10.3.7.77", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
|
| 5676 |
+
nvidia-cusolver-cu12 = {version = "11.7.1.2", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
|
| 5677 |
+
nvidia-cusparse-cu12 = {version = "12.5.4.2", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
|
| 5678 |
+
nvidia-cusparselt-cu12 = {version = "0.6.3", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
|
| 5679 |
+
nvidia-nccl-cu12 = {version = "2.26.2", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
|
| 5680 |
+
nvidia-nvjitlink-cu12 = {version = "12.6.85", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
|
| 5681 |
+
nvidia-nvtx-cu12 = {version = "12.6.77", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
|
| 5682 |
setuptools = {version = "*", markers = "python_version >= \"3.12\""}
|
| 5683 |
+
sympy = ">=1.13.3"
|
| 5684 |
+
triton = {version = "3.3.0", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
|
| 5685 |
typing-extensions = ">=4.10.0"
|
| 5686 |
|
| 5687 |
[package.extras]
|
|
|
|
| 5822 |
|
| 5823 |
[[package]]
|
| 5824 |
name = "triton"
|
| 5825 |
+
version = "3.3.0"
|
| 5826 |
description = "A language and compiler for custom Deep Learning operations"
|
| 5827 |
optional = false
|
| 5828 |
python-versions = "*"
|
| 5829 |
groups = ["main"]
|
| 5830 |
markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""
|
| 5831 |
files = [
|
| 5832 |
+
{file = "triton-3.3.0-cp310-cp310-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:fad99beafc860501d7fcc1fb7045d9496cbe2c882b1674640304949165a916e7"},
|
| 5833 |
+
{file = "triton-3.3.0-cp311-cp311-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:3161a2bf073d6b22c4e2f33f951f3e5e3001462b2570e6df9cd57565bdec2984"},
|
| 5834 |
+
{file = "triton-3.3.0-cp312-cp312-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:b68c778f6c4218403a6bd01be7484f6dc9e20fe2083d22dd8aef33e3b87a10a3"},
|
| 5835 |
+
{file = "triton-3.3.0-cp313-cp313-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:47bc87ad66fa4ef17968299acacecaab71ce40a238890acc6ad197c3abe2b8f1"},
|
| 5836 |
+
{file = "triton-3.3.0-cp313-cp313t-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:ce4700fc14032af1e049005ae94ba908e71cd6c2df682239aed08e49bc71b742"},
|
| 5837 |
+
{file = "triton-3.3.0-cp39-cp39-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:1f41403bfa0cbb3e24fd958ca7fee04e9681e55e539296db9aca30c42acae693"},
|
| 5838 |
]
|
| 5839 |
|
| 5840 |
+
[package.dependencies]
|
| 5841 |
+
setuptools = ">=40.8.0"
|
| 5842 |
+
|
| 5843 |
[package.extras]
|
| 5844 |
build = ["cmake (>=3.20)", "lit"]
|
| 5845 |
+
tests = ["autopep8", "isort", "llnl-hatchet", "numpy", "pytest", "pytest-forked", "pytest-xdist", "scipy (>=1.7.1)"]
|
| 5846 |
tutorials = ["matplotlib", "pandas", "tabulate"]
|
| 5847 |
|
| 5848 |
[[package]]
|
|
|
|
| 6505 |
[metadata]
|
| 6506 |
lock-version = "2.1"
|
| 6507 |
python-versions = "^3.10"
|
| 6508 |
+
content-hash = "c18debb8d18aec4081c31ff32f9dc2bde6f4c0189f1d7647bb6061f685e0e319"
|
pyproject.toml
CHANGED
|
@@ -22,11 +22,11 @@ pydantic = "^2.4.2"
|
|
| 22 |
pydantic-settings = "^2.0.3"
|
| 23 |
transformers = "^4.45.2"
|
| 24 |
python-dotenv = "^1.0.0"
|
| 25 |
-
torch = "^2.
|
| 26 |
tqdm = "^4.66.1"
|
| 27 |
ftfy = "^6.1.1"
|
| 28 |
rapidfuzz = "^3.8.1"
|
| 29 |
-
surya-ocr = "^0.14.
|
| 30 |
regex = "^2024.4.28"
|
| 31 |
pdftext = "~0.6.2"
|
| 32 |
markdownify = "^0.13.1"
|
|
|
|
| 22 |
pydantic-settings = "^2.0.3"
|
| 23 |
transformers = "^4.45.2"
|
| 24 |
python-dotenv = "^1.0.0"
|
| 25 |
+
torch = "^2.7.0"
|
| 26 |
tqdm = "^4.66.1"
|
| 27 |
ftfy = "^6.1.1"
|
| 28 |
rapidfuzz = "^3.8.1"
|
| 29 |
+
surya-ocr = "^0.14.2"
|
| 30 |
regex = "^2024.4.28"
|
| 31 |
pdftext = "~0.6.2"
|
| 32 |
markdownify = "^0.13.1"
|
tests/config/test_config.py
CHANGED
|
@@ -53,7 +53,7 @@ def test_config_none():
|
|
| 53 |
|
| 54 |
for key in crawler.attr_set:
|
| 55 |
# We force some options to become flags for ease of use on the CLI
|
| 56 |
-
value = None
|
| 57 |
assert kwargs.get(key) is value
|
| 58 |
|
| 59 |
|
|
@@ -64,3 +64,13 @@ def test_config_llm():
|
|
| 64 |
|
| 65 |
# Validate kwarg capturing
|
| 66 |
assert config_dict["use_llm"]
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 53 |
|
| 54 |
for key in crawler.attr_set:
|
| 55 |
# We force some options to become flags for ease of use on the CLI
|
| 56 |
+
value = None
|
| 57 |
assert kwargs.get(key) is value
|
| 58 |
|
| 59 |
|
|
|
|
| 64 |
|
| 65 |
# Validate kwarg capturing
|
| 66 |
assert config_dict["use_llm"]
|
| 67 |
+
|
| 68 |
+
|
| 69 |
+
def test_config_force_ocr():
|
| 70 |
+
kwargs = capture_kwargs(["test", "--force_ocr", "--format_lines"])
|
| 71 |
+
parser = ConfigParser(kwargs)
|
| 72 |
+
config_dict = parser.generate_config_dict()
|
| 73 |
+
|
| 74 |
+
# Validate kwarg capturing
|
| 75 |
+
assert config_dict["force_ocr"]
|
| 76 |
+
assert config_dict["format_lines"]
|