style: Format code with ruff

- Format 5 files affected by PDF scraper changes
- Ensures CI/CD code quality checks pass

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>
This commit is contained in:
yusyus
2026-01-27 21:08:05 +03:00
parent 3fc4b54164
commit 8f720670f2
5 changed files with 33 additions and 16 deletions

View File

@@ -794,7 +794,12 @@ class PDFExtractor:
markdown = page.get_text("markdown")
except (AssertionError, ValueError):
# Fallback to text format for older/newer PyMuPDF versions
markdown = page.get_text("text", flags=fitz.TEXT_PRESERVE_WHITESPACE | fitz.TEXT_PRESERVE_LIGATURES | fitz.TEXT_PRESERVE_SPANS)
markdown = page.get_text(
"text",
flags=fitz.TEXT_PRESERVE_WHITESPACE
| fitz.TEXT_PRESERVE_LIGATURES
| fitz.TEXT_PRESERVE_SPANS,
)
# Extract tables (Priority 2)
tables = self.extract_tables_from_page(page)