Skip to content

Commit bb02358

Browse files
chore(deps): lock file maintenance (#1188)
Co-authored-by: renovate[bot] <29139614+renovate[bot]@users.noreply.github.com>
Co-authored-by: James Braza <jamesbraza@gmail.com>
1 parent 607b350 commit bb02358

File tree

5 files changed

+3871
-3537
lines changed

5 files changed

+3871
-3537
lines changed

packages/paper-qa-docling/pyproject.toml

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -36,6 +36,7 @@ requires-python = ">=3.11"
3636

3737
[project.optional-dependencies]
3838
dev = [
39+
"docling-ibm-models[opencv-python-headless]>=3.10.0", # Lower pin and specify opencv after https://github.com/docling-project/docling-ibm-models/pull/130
3940
"docling>=2.56", # Pin for EasyOCR deprecation
4041
"fhlmi>=0.39", # Pin for bytes_to_string
4142
"paper-qa>=5.23", # Pin for PDFParserFn

packages/paper-qa-docling/tests/test_paperqa_docling.py

Lines changed: 9 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -241,11 +241,19 @@ def test_table_parsing() -> None:
241241
IN_GITHUB_ACTIONS: bool = os.getenv("GITHUB_ACTIONS") == "true"
242242

243243

244+
@pytest.mark.xfail(
245+
reason=(
246+
"Docling not respecting document_timeout,"
247+
" SEE: https://github.com/docling-project/docling/issues/2610"
248+
),
249+
raises=pytest.fail.Exception,
250+
)
244251
def test_document_timeout_denial() -> None:
245252
tic = time.perf_counter()
246253
with pytest.raises(ImpossibleParsingError, match="partial"):
247254
parse_pdf_to_pages(
248-
STUB_DATA_DIR / "pasa.pdf", custom_pipeline_options={"document_timeout": 1}
255+
STUB_DATA_DIR / "pasa.pdf",
256+
custom_pipeline_options={"document_timeout": 1},
249257
)
250258
if not IN_GITHUB_ACTIONS: # GitHub Actions runners are too noisy in timing
251259
# On 10/3/2025 on a MacBook M3 Pro with 36-GB RAM, reading PaSa took 18.7-sec

packages/paper-qa-pymupdf/tests/test_paperqa_pymupdf.py

Lines changed: 20 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -238,11 +238,23 @@ def custom_to_markdown(self, clean=False, fill_empty=True) -> str:
238238
), "Expected a few tables to be parsed for assertions to work"
239239
zeroth_media, *_ = next(iter(all_tables.values()))
240240
assert zeroth_media.text is None, "Expected null byte to be filtered"
241-
assert zeroth_raw_table_text == (
242-
"|Gap Size (mm)|Ununited|Uncertain|United|"
243-
"\n|---|---|---|---|"
244-
"\n|**1.0**|1/5 (20%)|1/5 (20%)|3/5 (60%)|"
245-
"\n|**1.5**|3/7 (43%)|2/7 (29%)|2/7 (29%)|"
246-
"\n|**2.0** <br>|3/6 (50%)|2/6 (33%)|1/6 (17%)|"
247-
"\n\n" # NOTE: this is before strip, so there can be trailing whitespace
248-
)
241+
try:
242+
# Seen with pymupdf==1.26.6
243+
assert zeroth_raw_table_text == (
244+
"|Gap Size (mm)|Ununited|Uncertain|United|"
245+
"\n|---|---|---|---|"
246+
"\n|**1.0**|1/5(20%)|1/5(20%)|3/5(60%)|"
247+
"\n|**1.5**|3/7(43%)|2/7(29%)|2/7(29%)|"
248+
"\n|**2.0**|3/6(50%)|2/6(33%)|1/6(17%)|"
249+
"\n\n" # NOTE: this is before strip, so there can be trailing whitespace
250+
)
251+
except AssertionError:
252+
# Seen with pymupdf==1.26.5
253+
assert zeroth_raw_table_text == (
254+
"|Gap Size (mm)|Ununited|Uncertain|United|"
255+
"\n|---|---|---|---|"
256+
"\n|**1.0**|1/5 (20%)|1/5 (20%)|3/5 (60%)|"
257+
"\n|**1.5**|3/7 (43%)|2/7 (29%)|2/7 (29%)|"
258+
"\n|**2.0** <br>|3/6 (50%)|2/6 (33%)|1/6 (17%)|"
259+
"\n\n" # NOTE: this is before strip, so there can be trailing whitespace
260+
)

tests/cassettes/test_get_reasoning[openrouter-deepseek].yaml

Lines changed: 2861 additions & 2836 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

0 commit comments

Comments
 (0)