Vik Paruchuri
committed on
Commit
·
5038c82
1
Parent(s):
7427f88
Review comments
Browse files
- marker/processors/line_numbers.py +2 -2
- marker/processors/text.py +2 -2
- marker/schema/blocks/base.py +4 -0
- poetry.lock +161 -161
- pyproject.toml +0 -1
- tests/conftest.py +1 -17
- tests/processors/test_ignoretext.py +19 -0
marker/processors/line_numbers.py
CHANGED
|
@@ -18,14 +18,14 @@ class LineNumbersProcessor(BaseProcessor):
|
|
| 18 |
if block.structure is None:
|
| 19 |
continue
|
| 20 |
|
| 21 |
-
all_lines =
|
| 22 |
if len(all_lines) < self.min_lines_in_block:
|
| 23 |
continue
|
| 24 |
|
| 25 |
starts_with_number = []
|
| 26 |
ends_with_number = []
|
| 27 |
for line in all_lines:
|
| 28 |
-
spans =
|
| 29 |
if len(spans) < 2:
|
| 30 |
starts_with_number.append(False)
|
| 31 |
ends_with_number.append(False)
|
|
|
|
| 18 |
if block.structure is None:
|
| 19 |
continue
|
| 20 |
|
| 21 |
+
all_lines = block.structure_blocks(document)
|
| 22 |
if len(all_lines) < self.min_lines_in_block:
|
| 23 |
continue
|
| 24 |
|
| 25 |
starts_with_number = []
|
| 26 |
ends_with_number = []
|
| 27 |
for line in all_lines:
|
| 28 |
+
spans = line.structure_blocks(document)
|
| 29 |
if len(spans) < 2:
|
| 30 |
starts_with_number.append(False)
|
| 31 |
ends_with_number.append(False)
|
marker/processors/text.py
CHANGED
|
@@ -49,7 +49,7 @@ class TextProcessor(BaseProcessor):
|
|
| 49 |
if next_block.structure is None: # This is odd though, why do we have text blocks with no structure?
|
| 50 |
continue
|
| 51 |
|
| 52 |
-
new_block_lines =
|
| 53 |
else: # page break
|
| 54 |
next_page = document.get_next_page(page)
|
| 55 |
if next_page is None:
|
|
@@ -80,7 +80,7 @@ class TextProcessor(BaseProcessor):
|
|
| 80 |
min_x = math.ceil(min([l.polygon.x_start for l in new_block_lines]))
|
| 81 |
next_block_starts_indented = new_block_lines[0].polygon.x_start > min_x
|
| 82 |
|
| 83 |
-
lines: List[Line] =
|
| 84 |
max_x = math.floor(max([l.polygon.x_end for l in lines]))
|
| 85 |
last_line_is_full_width = lines[-1].polygon.x_end >= max_x
|
| 86 |
|
|
|
|
| 49 |
if next_block.structure is None: # This is odd though, why do we have text blocks with no structure?
|
| 50 |
continue
|
| 51 |
|
| 52 |
+
new_block_lines = next_block.structure_blocks(document)
|
| 53 |
else: # page break
|
| 54 |
next_page = document.get_next_page(page)
|
| 55 |
if next_page is None:
|
|
|
|
| 80 |
min_x = math.ceil(min([l.polygon.x_start for l in new_block_lines]))
|
| 81 |
next_block_starts_indented = new_block_lines[0].polygon.x_start > min_x
|
| 82 |
|
| 83 |
+
lines: List[Line] = block.structure_blocks(document)
|
| 84 |
max_x = math.floor(max([l.polygon.x_end for l in lines]))
|
| 85 |
last_line_is_full_width = lines[-1].polygon.x_end >= max_x
|
| 86 |
|
marker/schema/blocks/base.py
CHANGED
|
@@ -74,6 +74,9 @@ class Block(BaseModel):
|
|
| 74 |
block_type=self.block_type
|
| 75 |
)
|
| 76 |
|
|
|
|
|
|
|
|
|
|
| 77 |
def add_structure(self, block: Block):
|
| 78 |
if self.structure is None:
|
| 79 |
self.structure = [block.id]
|
|
@@ -128,6 +131,7 @@ class Block(BaseModel):
|
|
| 128 |
def contained_blocks(self, document: Document, block_types: Sequence[BlockTypes] = None):
|
| 129 |
if self.structure is None:
|
| 130 |
return []
|
|
|
|
| 131 |
blocks = []
|
| 132 |
for block_id in self.structure:
|
| 133 |
block = document.get_block(block_id)
|
|
|
|
| 74 |
block_type=self.block_type
|
| 75 |
)
|
| 76 |
|
| 77 |
+
def structure_blocks(self, document_page) -> List[Block]:
|
| 78 |
+
return [document_page.get_block(block_id) for block_id in self.structure]
|
| 79 |
+
|
| 80 |
def add_structure(self, block: Block):
|
| 81 |
if self.structure is None:
|
| 82 |
self.structure = [block.id]
|
|
|
|
| 131 |
def contained_blocks(self, document: Document, block_types: Sequence[BlockTypes] = None):
|
| 132 |
if self.structure is None:
|
| 133 |
return []
|
| 134 |
+
|
| 135 |
blocks = []
|
| 136 |
for block_id in self.structure:
|
| 137 |
block = document.get_block(block_id)
|
poetry.lock
CHANGED
|
@@ -13,87 +13,87 @@ files = [
|
|
| 13 |
|
| 14 |
[[package]]
|
| 15 |
name = "aiohttp"
|
| 16 |
-
version = "3.11.
|
| 17 |
description = "Async http client/server framework (asyncio)"
|
| 18 |
optional = false
|
| 19 |
python-versions = ">=3.9"
|
| 20 |
files = [
|
| 21 |
-
{file = "aiohttp-3.11.
|
| 22 |
-
{file = "aiohttp-3.11.
|
| 23 |
-
{file = "aiohttp-3.11.
|
| 24 |
-
{file = "aiohttp-3.11.
|
| 25 |
-
{file = "aiohttp-3.11.
|
| 26 |
-
{file = "aiohttp-3.11.
|
| 27 |
-
{file = "aiohttp-3.11.
|
| 28 |
-
{file = "aiohttp-3.11.
|
| 29 |
-
{file = "aiohttp-3.11.
|
| 30 |
-
{file = "aiohttp-3.11.
|
| 31 |
-
{file = "aiohttp-3.11.
|
| 32 |
-
{file = "aiohttp-3.11.
|
| 33 |
-
{file = "aiohttp-3.11.
|
| 34 |
-
{file = "aiohttp-3.11.
|
| 35 |
-
{file = "aiohttp-3.11.
|
| 36 |
-
{file = "aiohttp-3.11.
|
| 37 |
-
{file = "aiohttp-3.11.
|
| 38 |
-
{file = "aiohttp-3.11.
|
| 39 |
-
{file = "aiohttp-3.11.
|
| 40 |
-
{file = "aiohttp-3.11.
|
| 41 |
-
{file = "aiohttp-3.11.
|
| 42 |
-
{file = "aiohttp-3.11.
|
| 43 |
-
{file = "aiohttp-3.11.
|
| 44 |
-
{file = "aiohttp-3.11.
|
| 45 |
-
{file = "aiohttp-3.11.
|
| 46 |
-
{file = "aiohttp-3.11.
|
| 47 |
-
{file = "aiohttp-3.11.
|
| 48 |
-
{file = "aiohttp-3.11.
|
| 49 |
-
{file = "aiohttp-3.11.
|
| 50 |
-
{file = "aiohttp-3.11.
|
| 51 |
-
{file = "aiohttp-3.11.
|
| 52 |
-
{file = "aiohttp-3.11.
|
| 53 |
-
{file = "aiohttp-3.11.
|
| 54 |
-
{file = "aiohttp-3.11.
|
| 55 |
-
{file = "aiohttp-3.11.
|
| 56 |
-
{file = "aiohttp-3.11.
|
| 57 |
-
{file = "aiohttp-3.11.
|
| 58 |
-
{file = "aiohttp-3.11.
|
| 59 |
-
{file = "aiohttp-3.11.
|
| 60 |
-
{file = "aiohttp-3.11.
|
| 61 |
-
{file = "aiohttp-3.11.
|
| 62 |
-
{file = "aiohttp-3.11.
|
| 63 |
-
{file = "aiohttp-3.11.
|
| 64 |
-
{file = "aiohttp-3.11.
|
| 65 |
-
{file = "aiohttp-3.11.
|
| 66 |
-
{file = "aiohttp-3.11.
|
| 67 |
-
{file = "aiohttp-3.11.
|
| 68 |
-
{file = "aiohttp-3.11.
|
| 69 |
-
{file = "aiohttp-3.11.
|
| 70 |
-
{file = "aiohttp-3.11.
|
| 71 |
-
{file = "aiohttp-3.11.
|
| 72 |
-
{file = "aiohttp-3.11.
|
| 73 |
-
{file = "aiohttp-3.11.
|
| 74 |
-
{file = "aiohttp-3.11.
|
| 75 |
-
{file = "aiohttp-3.11.
|
| 76 |
-
{file = "aiohttp-3.11.
|
| 77 |
-
{file = "aiohttp-3.11.
|
| 78 |
-
{file = "aiohttp-3.11.
|
| 79 |
-
{file = "aiohttp-3.11.
|
| 80 |
-
{file = "aiohttp-3.11.
|
| 81 |
-
{file = "aiohttp-3.11.
|
| 82 |
-
{file = "aiohttp-3.11.
|
| 83 |
-
{file = "aiohttp-3.11.
|
| 84 |
-
{file = "aiohttp-3.11.
|
| 85 |
-
{file = "aiohttp-3.11.
|
| 86 |
-
{file = "aiohttp-3.11.
|
| 87 |
-
{file = "aiohttp-3.11.
|
| 88 |
-
{file = "aiohttp-3.11.
|
| 89 |
-
{file = "aiohttp-3.11.
|
| 90 |
-
{file = "aiohttp-3.11.
|
| 91 |
-
{file = "aiohttp-3.11.
|
| 92 |
-
{file = "aiohttp-3.11.
|
| 93 |
-
{file = "aiohttp-3.11.
|
| 94 |
-
{file = "aiohttp-3.11.
|
| 95 |
-
{file = "aiohttp-3.11.
|
| 96 |
-
{file = "aiohttp-3.11.
|
| 97 |
]
|
| 98 |
|
| 99 |
[package.dependencies]
|
|
@@ -5134,93 +5134,93 @@ files = [
|
|
| 5134 |
|
| 5135 |
[[package]]
|
| 5136 |
name = "yarl"
|
| 5137 |
-
version = "1.
|
| 5138 |
description = "Yet another URL library"
|
| 5139 |
optional = false
|
| 5140 |
python-versions = ">=3.9"
|
| 5141 |
files = [
|
| 5142 |
-
{file = "yarl-1.
|
| 5143 |
-
{file = "yarl-1.
|
| 5144 |
-
{file = "yarl-1.
|
| 5145 |
-
{file = "yarl-1.
|
| 5146 |
-
{file = "yarl-1.
|
| 5147 |
-
{file = "yarl-1.
|
| 5148 |
-
{file = "yarl-1.
|
| 5149 |
-
{file = "yarl-1.
|
| 5150 |
-
{file = "yarl-1.
|
| 5151 |
-
{file = "yarl-1.
|
| 5152 |
-
{file = "yarl-1.
|
| 5153 |
-
{file = "yarl-1.
|
| 5154 |
-
{file = "yarl-1.
|
| 5155 |
-
{file = "yarl-1.
|
| 5156 |
-
{file = "yarl-1.
|
| 5157 |
-
{file = "yarl-1.
|
| 5158 |
-
{file = "yarl-1.
|
| 5159 |
-
{file = "yarl-1.
|
| 5160 |
-
{file = "yarl-1.
|
| 5161 |
-
{file = "yarl-1.
|
| 5162 |
-
{file = "yarl-1.
|
| 5163 |
-
{file = "yarl-1.
|
| 5164 |
-
{file = "yarl-1.
|
| 5165 |
-
{file = "yarl-1.
|
| 5166 |
-
{file = "yarl-1.
|
| 5167 |
-
{file = "yarl-1.
|
| 5168 |
-
{file = "yarl-1.
|
| 5169 |
-
{file = "yarl-1.
|
| 5170 |
-
{file = "yarl-1.
|
| 5171 |
-
{file = "yarl-1.
|
| 5172 |
-
{file = "yarl-1.
|
| 5173 |
-
{file = "yarl-1.
|
| 5174 |
-
{file = "yarl-1.
|
| 5175 |
-
{file = "yarl-1.
|
| 5176 |
-
{file = "yarl-1.
|
| 5177 |
-
{file = "yarl-1.
|
| 5178 |
-
{file = "yarl-1.
|
| 5179 |
-
{file = "yarl-1.
|
| 5180 |
-
{file = "yarl-1.
|
| 5181 |
-
{file = "yarl-1.
|
| 5182 |
-
{file = "yarl-1.
|
| 5183 |
-
{file = "yarl-1.
|
| 5184 |
-
{file = "yarl-1.
|
| 5185 |
-
{file = "yarl-1.
|
| 5186 |
-
{file = "yarl-1.
|
| 5187 |
-
{file = "yarl-1.
|
| 5188 |
-
{file = "yarl-1.
|
| 5189 |
-
{file = "yarl-1.
|
| 5190 |
-
{file = "yarl-1.
|
| 5191 |
-
{file = "yarl-1.
|
| 5192 |
-
{file = "yarl-1.
|
| 5193 |
-
{file = "yarl-1.
|
| 5194 |
-
{file = "yarl-1.
|
| 5195 |
-
{file = "yarl-1.
|
| 5196 |
-
{file = "yarl-1.
|
| 5197 |
-
{file = "yarl-1.
|
| 5198 |
-
{file = "yarl-1.
|
| 5199 |
-
{file = "yarl-1.
|
| 5200 |
-
{file = "yarl-1.
|
| 5201 |
-
{file = "yarl-1.
|
| 5202 |
-
{file = "yarl-1.
|
| 5203 |
-
{file = "yarl-1.
|
| 5204 |
-
{file = "yarl-1.
|
| 5205 |
-
{file = "yarl-1.
|
| 5206 |
-
{file = "yarl-1.
|
| 5207 |
-
{file = "yarl-1.
|
| 5208 |
-
{file = "yarl-1.
|
| 5209 |
-
{file = "yarl-1.
|
| 5210 |
-
{file = "yarl-1.
|
| 5211 |
-
{file = "yarl-1.
|
| 5212 |
-
{file = "yarl-1.
|
| 5213 |
-
{file = "yarl-1.
|
| 5214 |
-
{file = "yarl-1.
|
| 5215 |
-
{file = "yarl-1.
|
| 5216 |
-
{file = "yarl-1.
|
| 5217 |
-
{file = "yarl-1.
|
| 5218 |
-
{file = "yarl-1.
|
| 5219 |
-
{file = "yarl-1.
|
| 5220 |
-
{file = "yarl-1.
|
| 5221 |
-
{file = "yarl-1.
|
| 5222 |
-
{file = "yarl-1.
|
| 5223 |
-
{file = "yarl-1.
|
| 5224 |
]
|
| 5225 |
|
| 5226 |
[package.dependencies]
|
|
@@ -5231,4 +5231,4 @@ propcache = ">=0.2.0"
|
|
| 5231 |
[metadata]
|
| 5232 |
lock-version = "2.0"
|
| 5233 |
python-versions = "^3.10"
|
| 5234 |
-
content-hash = "
|
|
|
|
| 13 |
|
| 14 |
[[package]]
|
| 15 |
name = "aiohttp"
|
| 16 |
+
version = "3.11.7"
|
| 17 |
description = "Async http client/server framework (asyncio)"
|
| 18 |
optional = false
|
| 19 |
python-versions = ">=3.9"
|
| 20 |
files = [
|
| 21 |
+
{file = "aiohttp-3.11.7-cp310-cp310-macosx_10_9_universal2.whl", hash = "sha256:8bedb1f6cb919af3b6353921c71281b1491f948ca64408871465d889b4ee1b66"},
|
| 22 |
+
{file = "aiohttp-3.11.7-cp310-cp310-macosx_10_9_x86_64.whl", hash = "sha256:f5022504adab881e2d801a88b748ea63f2a9d130e0b2c430824682a96f6534be"},
|
| 23 |
+
{file = "aiohttp-3.11.7-cp310-cp310-macosx_11_0_arm64.whl", hash = "sha256:e22d1721c978a6494adc824e0916f9d187fa57baeda34b55140315fa2f740184"},
|
| 24 |
+
{file = "aiohttp-3.11.7-cp310-cp310-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:e993676c71288618eb07e20622572b1250d8713e7e00ab3aabae28cb70f3640d"},
|
| 25 |
+
{file = "aiohttp-3.11.7-cp310-cp310-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:e13a05db87d3b241c186d0936808d0e4e12decc267c617d54e9c643807e968b6"},
|
| 26 |
+
{file = "aiohttp-3.11.7-cp310-cp310-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:4ba8d043fed7ffa117024d7ba66fdea011c0e7602327c6d73cacaea38abe4491"},
|
| 27 |
+
{file = "aiohttp-3.11.7-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:dda3ed0a7869d2fa16aa41f9961ade73aa2c2e3b2fcb0a352524e7b744881889"},
|
| 28 |
+
{file = "aiohttp-3.11.7-cp310-cp310-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:43bfd25113c1e98aec6c70e26d5f4331efbf4aa9037ba9ad88f090853bf64d7f"},
|
| 29 |
+
{file = "aiohttp-3.11.7-cp310-cp310-musllinux_1_2_aarch64.whl", hash = "sha256:3dd3e7e7c9ef3e7214f014f1ae260892286647b3cf7c7f1b644a568fd410f8ca"},
|
| 30 |
+
{file = "aiohttp-3.11.7-cp310-cp310-musllinux_1_2_i686.whl", hash = "sha256:78c657ece7a73b976905ab9ec8be9ef2df12ed8984c24598a1791c58ce3b4ce4"},
|
| 31 |
+
{file = "aiohttp-3.11.7-cp310-cp310-musllinux_1_2_ppc64le.whl", hash = "sha256:db70a47987e34494b451a334605bee57a126fe8d290511349e86810b4be53b01"},
|
| 32 |
+
{file = "aiohttp-3.11.7-cp310-cp310-musllinux_1_2_s390x.whl", hash = "sha256:9e67531370a3b07e49b280c1f8c2df67985c790ad2834d1b288a2f13cd341c5f"},
|
| 33 |
+
{file = "aiohttp-3.11.7-cp310-cp310-musllinux_1_2_x86_64.whl", hash = "sha256:9202f184cc0582b1db15056f2225ab4c1e3dac4d9ade50dd0613ac3c46352ac2"},
|
| 34 |
+
{file = "aiohttp-3.11.7-cp310-cp310-win32.whl", hash = "sha256:2257bdd5cf54a4039a4337162cd8048f05a724380a2283df34620f55d4e29341"},
|
| 35 |
+
{file = "aiohttp-3.11.7-cp310-cp310-win_amd64.whl", hash = "sha256:b7215bf2b53bc6cb35808149980c2ae80a4ae4e273890ac85459c014d5aa60ac"},
|
| 36 |
+
{file = "aiohttp-3.11.7-cp311-cp311-macosx_10_9_universal2.whl", hash = "sha256:cea52d11e02123f125f9055dfe0ccf1c3857225fb879e4a944fae12989e2aef2"},
|
| 37 |
+
{file = "aiohttp-3.11.7-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:3ce18f703b7298e7f7633efd6a90138d99a3f9a656cb52c1201e76cb5d79cf08"},
|
| 38 |
+
{file = "aiohttp-3.11.7-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:670847ee6aeb3a569cd7cdfbe0c3bec1d44828bbfbe78c5d305f7f804870ef9e"},
|
| 39 |
+
{file = "aiohttp-3.11.7-cp311-cp311-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:4dda726f89bfa5c465ba45b76515135a3ece0088dfa2da49b8bb278f3bdeea12"},
|
| 40 |
+
{file = "aiohttp-3.11.7-cp311-cp311-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:c25b74a811dba37c7ea6a14d99eb9402d89c8d739d50748a75f3cf994cf19c43"},
|
| 41 |
+
{file = "aiohttp-3.11.7-cp311-cp311-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:e5522ee72f95661e79db691310290c4618b86dff2d9b90baedf343fd7a08bf79"},
|
| 42 |
+
{file = "aiohttp-3.11.7-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:1fbf41a6bbc319a7816ae0f0177c265b62f2a59ad301a0e49b395746eb2a9884"},
|
| 43 |
+
{file = "aiohttp-3.11.7-cp311-cp311-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:59ee1925b5a5efdf6c4e7be51deee93984d0ac14a6897bd521b498b9916f1544"},
|
| 44 |
+
{file = "aiohttp-3.11.7-cp311-cp311-musllinux_1_2_aarch64.whl", hash = "sha256:24054fce8c6d6f33a3e35d1c603ef1b91bbcba73e3f04a22b4f2f27dac59b347"},
|
| 45 |
+
{file = "aiohttp-3.11.7-cp311-cp311-musllinux_1_2_i686.whl", hash = "sha256:351849aca2c6f814575c1a485c01c17a4240413f960df1bf9f5deb0003c61a53"},
|
| 46 |
+
{file = "aiohttp-3.11.7-cp311-cp311-musllinux_1_2_ppc64le.whl", hash = "sha256:12724f3a211fa243570e601f65a8831372caf1a149d2f1859f68479f07efec3d"},
|
| 47 |
+
{file = "aiohttp-3.11.7-cp311-cp311-musllinux_1_2_s390x.whl", hash = "sha256:7ea4490360b605804bea8173d2d086b6c379d6bb22ac434de605a9cbce006e7d"},
|
| 48 |
+
{file = "aiohttp-3.11.7-cp311-cp311-musllinux_1_2_x86_64.whl", hash = "sha256:e0bf378db07df0a713a1e32381a1b277e62ad106d0dbe17b5479e76ec706d720"},
|
| 49 |
+
{file = "aiohttp-3.11.7-cp311-cp311-win32.whl", hash = "sha256:cd8d62cab363dfe713067027a5adb4907515861f1e4ce63e7be810b83668b847"},
|
| 50 |
+
{file = "aiohttp-3.11.7-cp311-cp311-win_amd64.whl", hash = "sha256:bf0e6cce113596377cadda4e3ac5fb89f095bd492226e46d91b4baef1dd16f60"},
|
| 51 |
+
{file = "aiohttp-3.11.7-cp312-cp312-macosx_10_13_universal2.whl", hash = "sha256:4bb7493c3e3a36d3012b8564bd0e2783259ddd7ef3a81a74f0dbfa000fce48b7"},
|
| 52 |
+
{file = "aiohttp-3.11.7-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:e143b0ef9cb1a2b4f74f56d4fbe50caa7c2bb93390aff52f9398d21d89bc73ea"},
|
| 53 |
+
{file = "aiohttp-3.11.7-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:f7c58a240260822dc07f6ae32a0293dd5bccd618bb2d0f36d51c5dbd526f89c0"},
|
| 54 |
+
{file = "aiohttp-3.11.7-cp312-cp312-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:8d20cfe63a1c135d26bde8c1d0ea46fd1200884afbc523466d2f1cf517d1fe33"},
|
| 55 |
+
{file = "aiohttp-3.11.7-cp312-cp312-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:12e4d45847a174f77b2b9919719203769f220058f642b08504cf8b1cf185dacf"},
|
| 56 |
+
{file = "aiohttp-3.11.7-cp312-cp312-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:cf4efa2d01f697a7dbd0509891a286a4af0d86902fc594e20e3b1712c28c0106"},
|
| 57 |
+
{file = "aiohttp-3.11.7-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:9ee6a4cdcbf54b8083dc9723cdf5f41f722c00db40ccf9ec2616e27869151129"},
|
| 58 |
+
{file = "aiohttp-3.11.7-cp312-cp312-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:c6095aaf852c34f42e1bd0cf0dc32d1e4b48a90bfb5054abdbb9d64b36acadcb"},
|
| 59 |
+
{file = "aiohttp-3.11.7-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:1cf03d27885f8c5ebf3993a220cc84fc66375e1e6e812731f51aab2b2748f4a6"},
|
| 60 |
+
{file = "aiohttp-3.11.7-cp312-cp312-musllinux_1_2_i686.whl", hash = "sha256:1a17f6a230f81eb53282503823f59d61dff14fb2a93847bf0399dc8e87817307"},
|
| 61 |
+
{file = "aiohttp-3.11.7-cp312-cp312-musllinux_1_2_ppc64le.whl", hash = "sha256:481f10a1a45c5f4c4a578bbd74cff22eb64460a6549819242a87a80788461fba"},
|
| 62 |
+
{file = "aiohttp-3.11.7-cp312-cp312-musllinux_1_2_s390x.whl", hash = "sha256:db37248535d1ae40735d15bdf26ad43be19e3d93ab3f3dad8507eb0f85bb8124"},
|
| 63 |
+
{file = "aiohttp-3.11.7-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:9d18a8b44ec8502a7fde91446cd9c9b95ce7c49f1eacc1fb2358b8907d4369fd"},
|
| 64 |
+
{file = "aiohttp-3.11.7-cp312-cp312-win32.whl", hash = "sha256:3d1c9c15d3999107cbb9b2d76ca6172e6710a12fda22434ee8bd3f432b7b17e8"},
|
| 65 |
+
{file = "aiohttp-3.11.7-cp312-cp312-win_amd64.whl", hash = "sha256:018f1b04883a12e77e7fc161934c0f298865d3a484aea536a6a2ca8d909f0ba0"},
|
| 66 |
+
{file = "aiohttp-3.11.7-cp313-cp313-macosx_10_13_universal2.whl", hash = "sha256:241a6ca732d2766836d62c58c49ca7a93d08251daef0c1e3c850df1d1ca0cbc4"},
|
| 67 |
+
{file = "aiohttp-3.11.7-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:aa3705a8d14de39898da0fbad920b2a37b7547c3afd2a18b9b81f0223b7d0f68"},
|
| 68 |
+
{file = "aiohttp-3.11.7-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:9acfc7f652b31853eed3b92095b0acf06fd5597eeea42e939bd23a17137679d5"},
|
| 69 |
+
{file = "aiohttp-3.11.7-cp313-cp313-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:dcefcf2915a2dbdbce37e2fc1622129a1918abfe3d06721ce9f6cdac9b6d2eaa"},
|
| 70 |
+
{file = "aiohttp-3.11.7-cp313-cp313-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:c1f6490dd1862af5aae6cfcf2a274bffa9a5b32a8f5acb519a7ecf5a99a88866"},
|
| 71 |
+
{file = "aiohttp-3.11.7-cp313-cp313-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:f1ac5462582d6561c1c1708853a9faf612ff4e5ea5e679e99be36143d6eabd8e"},
|
| 72 |
+
{file = "aiohttp-3.11.7-cp313-cp313-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:4c1a6309005acc4b2bcc577ba3b9169fea52638709ffacbd071f3503264620da"},
|
| 73 |
+
{file = "aiohttp-3.11.7-cp313-cp313-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:f5b973cce96793725ef63eb449adfb74f99c043c718acb76e0d2a447ae369962"},
|
| 74 |
+
{file = "aiohttp-3.11.7-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:ce91a24aac80de6be8512fb1c4838a9881aa713f44f4e91dd7bb3b34061b497d"},
|
| 75 |
+
{file = "aiohttp-3.11.7-cp313-cp313-musllinux_1_2_i686.whl", hash = "sha256:875f7100ce0e74af51d4139495eec4025affa1a605280f23990b6434b81df1bd"},
|
| 76 |
+
{file = "aiohttp-3.11.7-cp313-cp313-musllinux_1_2_ppc64le.whl", hash = "sha256:c171fc35d3174bbf4787381716564042a4cbc008824d8195eede3d9b938e29a8"},
|
| 77 |
+
{file = "aiohttp-3.11.7-cp313-cp313-musllinux_1_2_s390x.whl", hash = "sha256:ee9afa1b0d2293c46954f47f33e150798ad68b78925e3710044e0d67a9487791"},
|
| 78 |
+
{file = "aiohttp-3.11.7-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:8360c7cc620abb320e1b8d603c39095101391a82b1d0be05fb2225471c9c5c52"},
|
| 79 |
+
{file = "aiohttp-3.11.7-cp313-cp313-win32.whl", hash = "sha256:7a9318da4b4ada9a67c1dd84d1c0834123081e746bee311a16bb449f363d965e"},
|
| 80 |
+
{file = "aiohttp-3.11.7-cp313-cp313-win_amd64.whl", hash = "sha256:fc6da202068e0a268e298d7cd09b6e9f3997736cd9b060e2750963754552a0a9"},
|
| 81 |
+
{file = "aiohttp-3.11.7-cp39-cp39-macosx_10_9_universal2.whl", hash = "sha256:17829f37c0d31d89aa6b8b010475a10233774771f9b6dc2cc352ea4f8ce95d9a"},
|
| 82 |
+
{file = "aiohttp-3.11.7-cp39-cp39-macosx_10_9_x86_64.whl", hash = "sha256:d6177077a31b1aecfc3c9070bd2f11419dbb4a70f30f4c65b124714f525c2e48"},
|
| 83 |
+
{file = "aiohttp-3.11.7-cp39-cp39-macosx_11_0_arm64.whl", hash = "sha256:badda65ac99555791eed75e234afb94686ed2317670c68bff8a4498acdaee935"},
|
| 84 |
+
{file = "aiohttp-3.11.7-cp39-cp39-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:0de6466b9d742b4ee56fe1b2440706e225eb48c77c63152b1584864a236e7a50"},
|
| 85 |
+
{file = "aiohttp-3.11.7-cp39-cp39-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:04b0cc74d5a882c9dacaeeccc1444f0233212b6f5be8bc90833feef1e1ce14b9"},
|
| 86 |
+
{file = "aiohttp-3.11.7-cp39-cp39-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:28c7af3e50e5903d21d7b935aceed901cc2475463bc16ddd5587653548661fdb"},
|
| 87 |
+
{file = "aiohttp-3.11.7-cp39-cp39-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:c63f898f683d1379b9be5afc3dd139e20b30b0b1e0bf69a3fc3681f364cf1629"},
|
| 88 |
+
{file = "aiohttp-3.11.7-cp39-cp39-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:fdadc3f6a32d6eca45f9a900a254757fd7855dfb2d8f8dcf0e88f0fae3ff8eb1"},
|
| 89 |
+
{file = "aiohttp-3.11.7-cp39-cp39-musllinux_1_2_aarch64.whl", hash = "sha256:d329300fb23e14ed1f8c6d688dfd867d1dcc3b1d7cd49b7f8c5b44e797ce0932"},
|
| 90 |
+
{file = "aiohttp-3.11.7-cp39-cp39-musllinux_1_2_i686.whl", hash = "sha256:5578cf40440eafcb054cf859964bc120ab52ebe0e0562d2b898126d868749629"},
|
| 91 |
+
{file = "aiohttp-3.11.7-cp39-cp39-musllinux_1_2_ppc64le.whl", hash = "sha256:7b2f8107a3c329789f3c00b2daad0e35f548d0a55cda6291579136622099a46e"},
|
| 92 |
+
{file = "aiohttp-3.11.7-cp39-cp39-musllinux_1_2_s390x.whl", hash = "sha256:43dd89a6194f6ab02a3fe36b09e42e2df19c211fc2050ce37374d96f39604997"},
|
| 93 |
+
{file = "aiohttp-3.11.7-cp39-cp39-musllinux_1_2_x86_64.whl", hash = "sha256:d2fa6fc7cc865d26ff42480ac9b52b8c9b7da30a10a6442a9cdf429de840e949"},
|
| 94 |
+
{file = "aiohttp-3.11.7-cp39-cp39-win32.whl", hash = "sha256:a7d9a606355655617fee25dd7e54d3af50804d002f1fd3118dd6312d26692d70"},
|
| 95 |
+
{file = "aiohttp-3.11.7-cp39-cp39-win_amd64.whl", hash = "sha256:53c921b58fdc6485d6b2603e0132bb01cd59b8f0620ffc0907f525e0ba071687"},
|
| 96 |
+
{file = "aiohttp-3.11.7.tar.gz", hash = "sha256:01a8aca4af3da85cea5c90141d23f4b0eee3cbecfd33b029a45a80f28c66c668"},
|
| 97 |
]
|
| 98 |
|
| 99 |
[package.dependencies]
|
|
|
|
| 5134 |
|
| 5135 |
[[package]]
|
| 5136 |
name = "yarl"
|
| 5137 |
+
version = "1.18.0"
|
| 5138 |
description = "Yet another URL library"
|
| 5139 |
optional = false
|
| 5140 |
python-versions = ">=3.9"
|
| 5141 |
files = [
|
| 5142 |
+
{file = "yarl-1.18.0-cp310-cp310-macosx_10_9_universal2.whl", hash = "sha256:074fee89caab89a97e18ef5f29060ef61ba3cae6cd77673acc54bfdd3214b7b7"},
|
| 5143 |
+
{file = "yarl-1.18.0-cp310-cp310-macosx_10_9_x86_64.whl", hash = "sha256:b026cf2c32daf48d90c0c4e406815c3f8f4cfe0c6dfccb094a9add1ff6a0e41a"},
|
| 5144 |
+
{file = "yarl-1.18.0-cp310-cp310-macosx_11_0_arm64.whl", hash = "sha256:ae38bd86eae3ba3d2ce5636cc9e23c80c9db2e9cb557e40b98153ed102b5a736"},
|
| 5145 |
+
{file = "yarl-1.18.0-cp310-cp310-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:685cc37f3f307c6a8e879986c6d85328f4c637f002e219f50e2ef66f7e062c1d"},
|
| 5146 |
+
{file = "yarl-1.18.0-cp310-cp310-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:8254dbfce84ee5d1e81051ee7a0f1536c108ba294c0fdb5933476398df0654f3"},
|
| 5147 |
+
{file = "yarl-1.18.0-cp310-cp310-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:20de4a8b04de70c49698dc2390b7fd2d18d424d3b876371f9b775e2b462d4b41"},
|
| 5148 |
+
{file = "yarl-1.18.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:b0a2074a37285570d54b55820687de3d2f2b9ecf1b714e482e48c9e7c0402038"},
|
| 5149 |
+
{file = "yarl-1.18.0-cp310-cp310-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:3f576ed278860df2721a5d57da3381040176ef1d07def9688a385c8330db61a1"},
|
| 5150 |
+
{file = "yarl-1.18.0-cp310-cp310-musllinux_1_2_aarch64.whl", hash = "sha256:3a3709450a574d61be6ac53d582496014342ea34876af8dc17cc16da32826c9a"},
|
| 5151 |
+
{file = "yarl-1.18.0-cp310-cp310-musllinux_1_2_armv7l.whl", hash = "sha256:bd80ed29761490c622edde5dd70537ca8c992c2952eb62ed46984f8eff66d6e8"},
|
| 5152 |
+
{file = "yarl-1.18.0-cp310-cp310-musllinux_1_2_i686.whl", hash = "sha256:32141e13a1d5a48525e519c9197d3f4d9744d818d5c7d6547524cc9eccc8971e"},
|
| 5153 |
+
{file = "yarl-1.18.0-cp310-cp310-musllinux_1_2_ppc64le.whl", hash = "sha256:8b8d3e4e014fb4274f1c5bf61511d2199e263909fb0b8bda2a7428b0894e8dc6"},
|
| 5154 |
+
{file = "yarl-1.18.0-cp310-cp310-musllinux_1_2_s390x.whl", hash = "sha256:701bb4a8f4de191c8c0cc9a1e6d5142f4df880e9d1210e333b829ca9425570ed"},
|
| 5155 |
+
{file = "yarl-1.18.0-cp310-cp310-musllinux_1_2_x86_64.whl", hash = "sha256:a45d94075ac0647621eaaf693c8751813a3eccac455d423f473ffed38c8ac5c9"},
|
| 5156 |
+
{file = "yarl-1.18.0-cp310-cp310-win32.whl", hash = "sha256:34176bfb082add67cb2a20abd85854165540891147f88b687a5ed0dc225750a0"},
|
| 5157 |
+
{file = "yarl-1.18.0-cp310-cp310-win_amd64.whl", hash = "sha256:73553bbeea7d6ec88c08ad8027f4e992798f0abc459361bf06641c71972794dc"},
|
| 5158 |
+
{file = "yarl-1.18.0-cp311-cp311-macosx_10_9_universal2.whl", hash = "sha256:b8e8c516dc4e1a51d86ac975b0350735007e554c962281c432eaa5822aa9765c"},
|
| 5159 |
+
{file = "yarl-1.18.0-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:2e6b4466714a73f5251d84b471475850954f1fa6acce4d3f404da1d55d644c34"},
|
| 5160 |
+
{file = "yarl-1.18.0-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:c893f8c1a6d48b25961e00922724732d00b39de8bb0b451307482dc87bddcd74"},
|
| 5161 |
+
{file = "yarl-1.18.0-cp311-cp311-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:13aaf2bdbc8c86ddce48626b15f4987f22e80d898818d735b20bd58f17292ee8"},
|
| 5162 |
+
{file = "yarl-1.18.0-cp311-cp311-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:dd21c0128e301851de51bc607b0a6da50e82dc34e9601f4b508d08cc89ee7929"},
|
| 5163 |
+
{file = "yarl-1.18.0-cp311-cp311-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:205de377bd23365cd85562c9c6c33844050a93661640fda38e0567d2826b50df"},
|
| 5164 |
+
{file = "yarl-1.18.0-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:ed69af4fe2a0949b1ea1d012bf065c77b4c7822bad4737f17807af2adb15a73c"},
|
| 5165 |
+
{file = "yarl-1.18.0-cp311-cp311-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:8e1c18890091aa3cc8a77967943476b729dc2016f4cfe11e45d89b12519d4a93"},
|
| 5166 |
+
{file = "yarl-1.18.0-cp311-cp311-musllinux_1_2_aarch64.whl", hash = "sha256:91b8fb9427e33f83ca2ba9501221ffaac1ecf0407f758c4d2f283c523da185ee"},
|
| 5167 |
+
{file = "yarl-1.18.0-cp311-cp311-musllinux_1_2_armv7l.whl", hash = "sha256:536a7a8a53b75b2e98ff96edb2dfb91a26b81c4fed82782035767db5a465be46"},
|
| 5168 |
+
{file = "yarl-1.18.0-cp311-cp311-musllinux_1_2_i686.whl", hash = "sha256:a64619a9c47c25582190af38e9eb382279ad42e1f06034f14d794670796016c0"},
|
| 5169 |
+
{file = "yarl-1.18.0-cp311-cp311-musllinux_1_2_ppc64le.whl", hash = "sha256:c73a6bbc97ba1b5a0c3c992ae93d721c395bdbb120492759b94cc1ac71bc6350"},
|
| 5170 |
+
{file = "yarl-1.18.0-cp311-cp311-musllinux_1_2_s390x.whl", hash = "sha256:a173401d7821a2a81c7b47d4e7d5c4021375a1441af0c58611c1957445055056"},
|
| 5171 |
+
{file = "yarl-1.18.0-cp311-cp311-musllinux_1_2_x86_64.whl", hash = "sha256:7520e799b1f84e095cce919bd6c23c9d49472deeef25fe1ef960b04cca51c3fc"},
|
| 5172 |
+
{file = "yarl-1.18.0-cp311-cp311-win32.whl", hash = "sha256:c4cb992d8090d5ae5f7afa6754d7211c578be0c45f54d3d94f7781c495d56716"},
|
| 5173 |
+
{file = "yarl-1.18.0-cp311-cp311-win_amd64.whl", hash = "sha256:52c136f348605974c9b1c878addd6b7a60e3bf2245833e370862009b86fa4689"},
|
| 5174 |
+
{file = "yarl-1.18.0-cp312-cp312-macosx_10_13_universal2.whl", hash = "sha256:1ece25e2251c28bab737bdf0519c88189b3dd9492dc086a1d77336d940c28ced"},
|
| 5175 |
+
{file = "yarl-1.18.0-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:454902dc1830d935c90b5b53c863ba2a98dcde0fbaa31ca2ed1ad33b2a7171c6"},
|
| 5176 |
+
{file = "yarl-1.18.0-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:01be8688fc211dc237e628fcc209dda412d35de7642453059a0553747018d075"},
|
| 5177 |
+
{file = "yarl-1.18.0-cp312-cp312-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:4d26f1fa9fa2167bb238f6f4b20218eb4e88dd3ef21bb8f97439fa6b5313e30d"},
|
| 5178 |
+
{file = "yarl-1.18.0-cp312-cp312-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:b234a4a9248a9f000b7a5dfe84b8cb6210ee5120ae70eb72a4dcbdb4c528f72f"},
|
| 5179 |
+
{file = "yarl-1.18.0-cp312-cp312-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:fe94d1de77c4cd8caff1bd5480e22342dbd54c93929f5943495d9c1e8abe9f42"},
|
| 5180 |
+
{file = "yarl-1.18.0-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:9b4c90c5363c6b0a54188122b61edb919c2cd1119684999d08cd5e538813a28e"},
|
| 5181 |
+
{file = "yarl-1.18.0-cp312-cp312-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:49a98ecadc5a241c9ba06de08127ee4796e1009555efd791bac514207862b43d"},
|
| 5182 |
+
{file = "yarl-1.18.0-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:9106025c7f261f9f5144f9aa7681d43867eed06349a7cfb297a1bc804de2f0d1"},
|
| 5183 |
+
{file = "yarl-1.18.0-cp312-cp312-musllinux_1_2_armv7l.whl", hash = "sha256:f275ede6199d0f1ed4ea5d55a7b7573ccd40d97aee7808559e1298fe6efc8dbd"},
|
| 5184 |
+
{file = "yarl-1.18.0-cp312-cp312-musllinux_1_2_i686.whl", hash = "sha256:f7edeb1dcc7f50a2c8e08b9dc13a413903b7817e72273f00878cb70e766bdb3b"},
|
| 5185 |
+
{file = "yarl-1.18.0-cp312-cp312-musllinux_1_2_ppc64le.whl", hash = "sha256:c083f6dd6951b86e484ebfc9c3524b49bcaa9c420cb4b2a78ef9f7a512bfcc85"},
|
| 5186 |
+
{file = "yarl-1.18.0-cp312-cp312-musllinux_1_2_s390x.whl", hash = "sha256:80741ec5b471fbdfb997821b2842c59660a1c930ceb42f8a84ba8ca0f25a66aa"},
|
| 5187 |
+
{file = "yarl-1.18.0-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:b1a3297b9cad594e1ff0c040d2881d7d3a74124a3c73e00c3c71526a1234a9f7"},
|
| 5188 |
+
{file = "yarl-1.18.0-cp312-cp312-win32.whl", hash = "sha256:cd6ab7d6776c186f544f893b45ee0c883542b35e8a493db74665d2e594d3ca75"},
|
| 5189 |
+
{file = "yarl-1.18.0-cp312-cp312-win_amd64.whl", hash = "sha256:039c299a0864d1f43c3e31570045635034ea7021db41bf4842693a72aca8df3a"},
|
| 5190 |
+
{file = "yarl-1.18.0-cp313-cp313-macosx_10_13_universal2.whl", hash = "sha256:6fb64dd45453225f57d82c4764818d7a205ee31ce193e9f0086e493916bd4f72"},
|
| 5191 |
+
{file = "yarl-1.18.0-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:3adaaf9c6b1b4fc258584f4443f24d775a2086aee82d1387e48a8b4f3d6aecf6"},
|
| 5192 |
+
{file = "yarl-1.18.0-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:da206d1ec78438a563c5429ab808a2b23ad7bc025c8adbf08540dde202be37d5"},
|
| 5193 |
+
{file = "yarl-1.18.0-cp313-cp313-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:576d258b21c1db4c6449b1c572c75d03f16a482eb380be8003682bdbe7db2f28"},
|
| 5194 |
+
{file = "yarl-1.18.0-cp313-cp313-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:c60e547c0a375c4bfcdd60eef82e7e0e8698bf84c239d715f5c1278a73050393"},
|
| 5195 |
+
{file = "yarl-1.18.0-cp313-cp313-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:e3818eabaefb90adeb5e0f62f047310079d426387991106d4fbf3519eec7d90a"},
|
| 5196 |
+
{file = "yarl-1.18.0-cp313-cp313-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:a5f72421246c21af6a92fbc8c13b6d4c5427dfd949049b937c3b731f2f9076bd"},
|
| 5197 |
+
{file = "yarl-1.18.0-cp313-cp313-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:7fa7d37f2ada0f42e0723632993ed422f2a679af0e200874d9d861720a54f53e"},
|
| 5198 |
+
{file = "yarl-1.18.0-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:42ba84e2ac26a3f252715f8ec17e6fdc0cbf95b9617c5367579fafcd7fba50eb"},
|
| 5199 |
+
{file = "yarl-1.18.0-cp313-cp313-musllinux_1_2_armv7l.whl", hash = "sha256:6a49ad0102c0f0ba839628d0bf45973c86ce7b590cdedf7540d5b1833ddc6f00"},
|
| 5200 |
+
{file = "yarl-1.18.0-cp313-cp313-musllinux_1_2_i686.whl", hash = "sha256:96404e8d5e1bbe36bdaa84ef89dc36f0e75939e060ca5cd45451aba01db02902"},
|
| 5201 |
+
{file = "yarl-1.18.0-cp313-cp313-musllinux_1_2_ppc64le.whl", hash = "sha256:a0509475d714df8f6d498935b3f307cd122c4ca76f7d426c7e1bb791bcd87eda"},
|
| 5202 |
+
{file = "yarl-1.18.0-cp313-cp313-musllinux_1_2_s390x.whl", hash = "sha256:1ff116f0285b5c8b3b9a2680aeca29a858b3b9e0402fc79fd850b32c2bcb9f8b"},
|
| 5203 |
+
{file = "yarl-1.18.0-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:e2580c1d7e66e6d29d6e11855e3b1c6381971e0edd9a5066e6c14d79bc8967af"},
|
| 5204 |
+
{file = "yarl-1.18.0-cp313-cp313-win32.whl", hash = "sha256:14408cc4d34e202caba7b5ac9cc84700e3421a9e2d1b157d744d101b061a4a88"},
|
| 5205 |
+
{file = "yarl-1.18.0-cp313-cp313-win_amd64.whl", hash = "sha256:1db1537e9cb846eb0ff206eac667f627794be8b71368c1ab3207ec7b6f8c5afc"},
|
| 5206 |
+
{file = "yarl-1.18.0-cp39-cp39-macosx_10_9_universal2.whl", hash = "sha256:fa2c9cb607e0f660d48c54a63de7a9b36fef62f6b8bd50ff592ce1137e73ac7d"},
|
| 5207 |
+
{file = "yarl-1.18.0-cp39-cp39-macosx_10_9_x86_64.whl", hash = "sha256:c0f4808644baf0a434a3442df5e0bedf8d05208f0719cedcd499e168b23bfdc4"},
|
| 5208 |
+
{file = "yarl-1.18.0-cp39-cp39-macosx_11_0_arm64.whl", hash = "sha256:7db9584235895a1dffca17e1c634b13870852094f6389b68dcc6338086aa7b08"},
|
| 5209 |
+
{file = "yarl-1.18.0-cp39-cp39-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:309f8d27d6f93ceeeb80aa6980e883aa57895270f7f41842b92247e65d7aeddf"},
|
| 5210 |
+
{file = "yarl-1.18.0-cp39-cp39-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:609ffd44fed2ed88d9b4ef62ee860cf86446cf066333ad4ce4123505b819e581"},
|
| 5211 |
+
{file = "yarl-1.18.0-cp39-cp39-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:f172b8b2c72a13a06ea49225a9c47079549036ad1b34afa12d5491b881f5b993"},
|
| 5212 |
+
{file = "yarl-1.18.0-cp39-cp39-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:d89ae7de94631b60d468412c18290d358a9d805182373d804ec839978b120422"},
|
| 5213 |
+
{file = "yarl-1.18.0-cp39-cp39-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:466d31fd043ef9af822ee3f1df8fdff4e8c199a7f4012c2642006af240eade17"},
|
| 5214 |
+
{file = "yarl-1.18.0-cp39-cp39-musllinux_1_2_aarch64.whl", hash = "sha256:7609b8462351c4836b3edce4201acb6dd46187b207c589b30a87ffd1813b48dc"},
|
| 5215 |
+
{file = "yarl-1.18.0-cp39-cp39-musllinux_1_2_armv7l.whl", hash = "sha256:d9d4f5e471e8dc49b593a80766c2328257e405f943c56a3dc985c125732bc4cf"},
|
| 5216 |
+
{file = "yarl-1.18.0-cp39-cp39-musllinux_1_2_i686.whl", hash = "sha256:67b336c15e564d76869c9a21316f90edf546809a5796a083b8f57c845056bc01"},
|
| 5217 |
+
{file = "yarl-1.18.0-cp39-cp39-musllinux_1_2_ppc64le.whl", hash = "sha256:b212452b80cae26cb767aa045b051740e464c5129b7bd739c58fbb7deb339e7b"},
|
| 5218 |
+
{file = "yarl-1.18.0-cp39-cp39-musllinux_1_2_s390x.whl", hash = "sha256:38b39b7b3e692b6c92b986b00137a3891eddb66311b229d1940dcbd4f025083c"},
|
| 5219 |
+
{file = "yarl-1.18.0-cp39-cp39-musllinux_1_2_x86_64.whl", hash = "sha256:a7ee6884a8848792d58b854946b685521f41d8871afa65e0d4a774954e9c9e89"},
|
| 5220 |
+
{file = "yarl-1.18.0-cp39-cp39-win32.whl", hash = "sha256:b4095c5019bb889aa866bf12ed4c85c0daea5aafcb7c20d1519f02a1e738f07f"},
|
| 5221 |
+
{file = "yarl-1.18.0-cp39-cp39-win_amd64.whl", hash = "sha256:2d90f2e4d16a5b0915ee065218b435d2ef619dd228973b1b47d262a6f7cd8fa5"},
|
| 5222 |
+
{file = "yarl-1.18.0-py3-none-any.whl", hash = "sha256:dbf53db46f7cf176ee01d8d98c39381440776fcda13779d269a8ba664f69bec0"},
|
| 5223 |
+
{file = "yarl-1.18.0.tar.gz", hash = "sha256:20d95535e7d833889982bfe7cc321b7f63bf8879788fee982c76ae2b24cfb715"},
|
| 5224 |
]
|
| 5225 |
|
| 5226 |
[package.dependencies]
|
|
|
|
| 5231 |
[metadata]
|
| 5232 |
lock-version = "2.0"
|
| 5233 |
python-versions = "^3.10"
|
| 5234 |
+
content-hash = "4a5f7a6283c83d4d8397aac777fcccb9bb7622fe2f0a317baaf9553092b0259b"
|
pyproject.toml
CHANGED
|
@@ -34,7 +34,6 @@ ftfy = "^6.1.1"
|
|
| 34 |
texify = "^0.2.1"
|
| 35 |
rapidfuzz = "^3.8.1"
|
| 36 |
surya-ocr = { git = "https://github.com/VikParuchuri/surya.git", branch = "layout2" }
|
| 37 |
-
filetype = "^1.2.0"
|
| 38 |
regex = "^2024.4.28"
|
| 39 |
pdftext = "^0.3.19"
|
| 40 |
tabled-pdf = { git = "https://github.com/VikParuchuri/tabled.git", branch = "dev-mose/compilation-updates" }
|
|
|
|
| 34 |
texify = "^0.2.1"
|
| 35 |
rapidfuzz = "^3.8.1"
|
| 36 |
surya-ocr = { git = "https://github.com/VikParuchuri/surya.git", branch = "layout2" }
|
|
|
|
| 37 |
regex = "^2024.4.28"
|
| 38 |
pdftext = "^0.3.19"
|
| 39 |
tabled-pdf = { git = "https://github.com/VikParuchuri/tabled.git", branch = "dev-mose/compilation-updates" }
|
tests/conftest.py
CHANGED
|
@@ -12,13 +12,6 @@ from marker.converters.pdf import PdfConverter
|
|
| 12 |
from marker.models import setup_detection_model, setup_layout_model, \
|
| 13 |
setup_recognition_model, setup_table_rec_model, \
|
| 14 |
setup_texify_model
|
| 15 |
-
from marker.processors.code import CodeProcessor
|
| 16 |
-
from marker.processors.debug import DebugProcessor
|
| 17 |
-
from marker.processors.document_toc import DocumentTOCProcessor
|
| 18 |
-
from marker.processors.equation import EquationProcessor
|
| 19 |
-
from marker.processors.sectionheader import SectionHeaderProcessor
|
| 20 |
-
from marker.processors.table import TableProcessor
|
| 21 |
-
from marker.processors.text import TextProcessor
|
| 22 |
from marker.schema import BlockTypes
|
| 23 |
from marker.schema.blocks import Block
|
| 24 |
from marker.renderers.markdown import MarkdownRenderer
|
|
@@ -111,18 +104,9 @@ def pdf_converter(request, config, layout_model, texify_model, recognition_model
|
|
| 111 |
"table_rec_model": table_rec_model,
|
| 112 |
"detection_model": detection_model
|
| 113 |
}
|
| 114 |
-
processor_list = [
|
| 115 |
-
EquationProcessor,
|
| 116 |
-
TableProcessor,
|
| 117 |
-
SectionHeaderProcessor,
|
| 118 |
-
TextProcessor,
|
| 119 |
-
CodeProcessor,
|
| 120 |
-
DocumentTOCProcessor,
|
| 121 |
-
DebugProcessor,
|
| 122 |
-
]
|
| 123 |
yield PdfConverter(
|
| 124 |
artifact_dict=model_dict,
|
| 125 |
-
processor_list=
|
| 126 |
renderer=classes_to_strings([renderer])[0],
|
| 127 |
config=config
|
| 128 |
)
|
|
|
|
| 12 |
from marker.models import setup_detection_model, setup_layout_model, \
|
| 13 |
setup_recognition_model, setup_table_rec_model, \
|
| 14 |
setup_texify_model
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 15 |
from marker.schema import BlockTypes
|
| 16 |
from marker.schema.blocks import Block
|
| 17 |
from marker.renderers.markdown import MarkdownRenderer
|
|
|
|
| 104 |
"table_rec_model": table_rec_model,
|
| 105 |
"detection_model": detection_model
|
| 106 |
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 107 |
yield PdfConverter(
|
| 108 |
artifact_dict=model_dict,
|
| 109 |
+
processor_list=None,
|
| 110 |
renderer=classes_to_strings([renderer])[0],
|
| 111 |
config=config
|
| 112 |
)
|
tests/processors/test_ignoretext.py
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import pytest
|
| 2 |
+
|
| 3 |
+
from marker.processors.ignoretext import IgnoreTextProcessor
|
| 4 |
+
from marker.schema import BlockTypes
|
| 5 |
+
|
| 6 |
+
|
| 7 |
+
@pytest.mark.filename("bio_pdf.pdf")
|
| 8 |
+
@pytest.mark.config({"page_range": list(range(6))})
|
| 9 |
+
@pytest.mark.skip(reason="Need to wait for layout model to stabilize before activating.")
|
| 10 |
+
def test_ignoretext_processor(pdf_document):
|
| 11 |
+
processor = IgnoreTextProcessor()
|
| 12 |
+
processor(pdf_document)
|
| 13 |
+
|
| 14 |
+
page0_header = pdf_document.pages[0].contained_blocks(pdf_document, [BlockTypes.Text])[0]
|
| 15 |
+
assert "bioRxiv" in page0_header.raw_text(pdf_document)
|
| 16 |
+
breakpoint()
|
| 17 |
+
|
| 18 |
+
first_span = page0_header.contained_blocks(pdf_document, [BlockTypes.Span])[0]
|
| 19 |
+
assert first_span.ignore_for_output is True
|