Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 4 additions & 0 deletions context_chat_backend/chain/ingest/doc_loader.py
Original file line number Diff line number Diff line change
Expand Up @@ -16,6 +16,7 @@
from odfdo import Document
from pandas import read_csv, read_excel
from pypdf import PdfReader
from pypdf.errors import FileNotDecryptedError as PdfFileNotDecryptedError
from striprtf import striprtf

logger = logging.getLogger('ccb.doc_loader')
Expand Down Expand Up @@ -133,6 +134,9 @@ def decode_source(source: UploadFile) -> str | None:
result = source.file.read().decode('utf-8', 'ignore')
source.file.close()
return result
except PdfFileNotDecryptedError:
logger.warning(f'PDF file ({source.filename}) is encrypted and cannot be read')
return None
except Exception:
logger.exception(f'Error decoding source file ({source.filename})', stack_info=True)
return None
Expand Down
1 change: 1 addition & 0 deletions requirements.txt
Original file line number Diff line number Diff line change
@@ -1,5 +1,6 @@
apscheduler
chromadb
cryptography
ctransformers
epub2txt
fastapi
Expand Down
Loading