Skip to content

Commit

Permalink
Fix PDFs unit test, skip OCR
Browse files: browse the repository at this point in the history
  • Loading branch information
sabaimran committed Oct 21, 2024
1 parent 59fec37 commit ad197be
Showing 1 changed file with 3 additions and 0 deletions.
3 changes: 3 additions & 0 deletions tests/test_pdf_to_entries.py
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,8 @@
import os
import re

import pytest

from khoj.processor.content.pdf.pdf_to_entries import PdfToEntries
from khoj.utils.fs_syncer import get_pdf_files
from khoj.utils.rawconfig import TextContentConfig
Expand Down Expand Up @@ -37,6 +39,7 @@ def test_multi_page_pdf_to_jsonl():
assert len(entries[1]) == 6


@pytest.mark.skip(reason="Temporarily disabled OCR due to performance issues")
def test_ocr_page_pdf_to_jsonl():
"Convert multiple pages from single PDF file to jsonl."
# Arrange
Expand Down

0 comments on commit ad197be

Please sign in to comment.