From 25460cdbe5815d347112e88a57566a22eec6e488 Mon Sep 17 00:00:00 2001 From: invoker Date: Wed, 12 Apr 2023 13:15:13 +0800 Subject: [PATCH 1/3] Fix [Errno 13] Permission denied on Windows --- pipelines/pipelines/nodes/file_converter/pdf.py | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/pipelines/pipelines/nodes/file_converter/pdf.py b/pipelines/pipelines/nodes/file_converter/pdf.py index 88c61f365fe1..670335a67c42 100644 --- a/pipelines/pipelines/nodes/file_converter/pdf.py +++ b/pipelines/pipelines/nodes/file_converter/pdf.py @@ -209,9 +209,11 @@ def convert( try: images = convert_from_path(file_path) for image in images: - temp_img = tempfile.NamedTemporaryFile(dir=os.path.dirname(os.path.realpath(__file__)), suffix=".jpeg") + temp_img = tempfile.NamedTemporaryFile(dir=os.path.dirname(os.path.realpath(__file__)), suffix=".jpeg", delete=False) image.save(temp_img.name) pages.append(self.image_2_text.convert(temp_img.name)[0]["content"]) + temp_img.close() + os.remove(temp_img.name) except Exception as exception: logger.error(f"File {file_path} has an error \n {exception}") From e5b61cd0c15f458b40f3ddd9b554b54bdcab5a35 Mon Sep 17 00:00:00 2001 From: invoker Date: Wed, 12 Apr 2023 14:22:39 +0800 Subject: [PATCH 2/3] formatting code --- pipelines/pipelines/nodes/file_converter/pdf.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/pipelines/pipelines/nodes/file_converter/pdf.py b/pipelines/pipelines/nodes/file_converter/pdf.py index 670335a67c42..66341d9e87dc 100644 --- a/pipelines/pipelines/nodes/file_converter/pdf.py +++ b/pipelines/pipelines/nodes/file_converter/pdf.py @@ -209,7 +209,8 @@ def convert( try: images = convert_from_path(file_path) for image in images: - temp_img = tempfile.NamedTemporaryFile(dir=os.path.dirname(os.path.realpath(__file__)), suffix=".jpeg", delete=False) + temp_img = tempfile.NamedTemporaryFile(dir=os.path.dirname(os.path.realpath(__file__)), suffix=".jpeg", + delete=False) 
image.save(temp_img.name) pages.append(self.image_2_text.convert(temp_img.name)[0]["content"]) temp_img.close() From 0f8a0920266360d8bb732b06c16b9957773dc1a6 Mon Sep 17 00:00:00 2001 From: invoker Date: Thu, 13 Apr 2023 11:19:28 +0800 Subject: [PATCH 3/3] formatting code --- pipelines/pipelines/nodes/file_converter/pdf.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/pipelines/pipelines/nodes/file_converter/pdf.py b/pipelines/pipelines/nodes/file_converter/pdf.py index 66341d9e87dc..874da76169c9 100644 --- a/pipelines/pipelines/nodes/file_converter/pdf.py +++ b/pipelines/pipelines/nodes/file_converter/pdf.py @@ -209,8 +209,9 @@ def convert( try: images = convert_from_path(file_path) for image in images: - temp_img = tempfile.NamedTemporaryFile(dir=os.path.dirname(os.path.realpath(__file__)), suffix=".jpeg", - delete=False) + temp_img = tempfile.NamedTemporaryFile( + dir=os.path.dirname(os.path.realpath(__file__)), suffix=".jpeg", delete=False + ) image.save(temp_img.name) pages.append(self.image_2_text.convert(temp_img.name)[0]["content"]) temp_img.close()