From 2f7edeb684f05c782a5bc986a363c09059b04d8b Mon Sep 17 00:00:00 2001 From: Saidgurbuz Date: Tue, 20 May 2025 11:33:47 +0200 Subject: [PATCH] update load_from_doctags usage Signed-off-by: Saidgurbuz --- docling_eval/evaluators/adapters.py | 3 +-- docling_eval/evaluators/base_evaluator.py | 3 +-- docling_eval/prediction_providers/file_provider.py | 5 +++-- 3 files changed, 5 insertions(+), 6 deletions(-) diff --git a/docling_eval/evaluators/adapters.py b/docling_eval/evaluators/adapters.py index 81d6e47f..78a1b9f8 100644 --- a/docling_eval/evaluators/adapters.py +++ b/docling_eval/evaluators/adapters.py @@ -60,6 +60,5 @@ def _doctags_to_doc(self, doc_id, doctags: str) -> DoclingDocument: """ doctags_page = DocTagsPage(tokens=doctags) doctags_doc = DocTagsDocument(pages=[doctags_page]) - doc = DoclingDocument(name=doc_id) - doc.load_from_doctags(doctags_doc) + doc = DoclingDocument.load_from_doctags(doctags_doc, document_name=doc_id) return doc diff --git a/docling_eval/evaluators/base_evaluator.py b/docling_eval/evaluators/base_evaluator.py index 19664eda..940f6bc5 100644 --- a/docling_eval/evaluators/base_evaluator.py +++ b/docling_eval/evaluators/base_evaluator.py @@ -56,8 +56,7 @@ def docling_document_from_doctags( doctags_page = DocTagsPage(tokens=doctags, image=page_image) doctags_doc = DocTagsDocument(pages=[doctags_page]) - pred_doc = DoclingDocument(name=doc_id) - pred_doc.load_from_doctags(doctags_doc) + pred_doc = DoclingDocument.load_from_doctags(doctags_doc, document_name=doc_id) return pred_doc diff --git a/docling_eval/prediction_providers/file_provider.py b/docling_eval/prediction_providers/file_provider.py index 1d91f6b3..79eed286 100644 --- a/docling_eval/prediction_providers/file_provider.py +++ b/docling_eval/prediction_providers/file_provider.py @@ -180,8 +180,9 @@ def _load_doctags_doc(self, record: DatasetRecord) -> Optional[DoclingDocument]: # Build DoclingDocument doctags_page = DocTagsPage(tokens=doctags, image=page_image) doctags_doc = DocTagsDocument(pages=[doctags_page]) - doc = DoclingDocument(name=record.doc_id) - doc.load_from_doctags(doctags_doc) + doc = DoclingDocument.load_from_doctags( + doctags_doc, document_name=record.doc_id + ) return doc except Exception as e: